Sh4dow's Blog

活了二十几年,从来没有人给过我一次意外感动或惊喜,也没有人在我生日的时候给过我特别的礼物,生病的时候得到的只是一些不在身边的语言安慰,也不见谁真正的照顾过自己,甚至有的时候自己蒙头睡一觉就好了,也有人喜欢过我,但是从没见谁坚持过。

python获取QQ企业邮箱通讯录

---------------

#!/usr/bin/env python

# -*- coding: utf-8 -*-

# @Last Modified time: 2016-03-03 22:45:18

# @Description: 获取腾讯企业邮箱通讯录

import requests

import re

import rsa

import sys

import base64

import time

import argparse

reload(sys)


sys.setdefaultencoding('utf8')



# 打印部门人员信息

def print_tree(id, department_infos, level, staff_infors, f):

    prefix = '----' * level

    text = prefix + department_infos[id]['name'] + prefix

    print text

    f.write(text + '\n')

    for key, value in department_infos.items():

        if value['pid'] == id:

            print_tree(

                value['id'], department_infos, level + 1, staff_infors, f)

    prefix = '    ' * level

    for staff in staff_infors:

        if staff['pid'] == id:

            text = prefix + staff['name'] + '  ' + staff['alias']

            print text

            f.write(text + '\n')



# 提取RSA算法的公钥

def get_public_key(content):

    regexp = r'var\s*PublicKey\s*=\s*"(\w+?)";'

    results = re.findall(regexp, content)

    if results:

        return results[0]



# 获取ts参数

def get_ts(content):

    regexp = r'PublicTs\s*=\s*"([0-9]+)"'

    results = re.findall(regexp, content)

    if results:

        return results[0]



# 计算p参数

def get_p(public_key, password, ts):

    public_key = rsa.PublicKey(int(public_key, 16), 65537)

    res_tmp = rsa.encrypt(

        '{password}\n{ts}\n'.format(password=password, ts=ts), public_key)

    return base64.b64encode(res_tmp)



def msg():

    return 'python get_tencent_exmail_contacts.py -u name@domain.com -p passw0rd'


if __name__ == "__main__":

    description = "获取腾讯企业邮箱通讯录"

    parser = argparse.ArgumentParser(description=description, usage=msg())

    parser.add_argument(

        "-u", "--email", required=True, dest="email", help="邮箱名")

    parser.add_argument(

        "-p", "--password", required=True, dest="password", help="邮箱密码")

    parser.add_argument(

        "-l", "--limit", required=False, dest="limit", default=10000, help="通讯录条数")

    parser.add_argument(

        "-e", "--efile", required=False, dest="emailfile", default="emails.txt", help="邮箱保存文件")

    parser.add_argument(

        "-d", "--dfile", required=False, dest="departfile", default="departments.txt", help="部门信息保存文件")

    args = parser.parse_args()

    email = args.email

    password = args.password

    limit = args.limit

    emailfile = args.emailfile

    departfile = args.departfile

    session = requests.Session()


    headers = {'Connection': 'keep-alive',

               'Cache-Control': 'max-age=0',

               'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',

               'Upgrade-Insecure-Requests': 1,

               'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/48.0.2564.116 Safari/537.36',

               'DNT': 1,

               'Accept-Encoding': 'gzip, deflate, sdch',

               'Accept-Language': 'zh-CN,zh;q=0.8,en-US;q=0.6,en;q=0.4',

               }

    resp = session.get('http://exmail.qq.com/login', headers=headers)

    content = resp.content


    public_key = get_public_key(content)


    ts = get_ts(content)


    p = get_p(public_key, password, ts)


    # print ts

    # print public_key

    # print p


    uin = email.split('@')[0]

    domain = email.split('@')[1]

    # print uin

    # print domain


    post_data = {}

    post_data['sid'] = ''

    post_data['firstlogin'] = False

    post_data['domain'] = domain

    post_data['aliastype'] = 'other'

    post_data['errtemplate'] = 'dm_loginpage'

    post_data['first_step'] = ''

    post_data['buy_amount'] = ''

    post_data['year'] = ''

    post_data['company_name'] = ''

    post_data['is_get_dp_coupon'] = ''

    post_data['starttime'] = int(time.time() * 1000)

    post_data['redirecturl'] = ''

    post_data['f'] = 'biz'

    post_data['uin'] = uin

    post_data['p'] = p

    post_data['delegate_url'] = ''

    post_data['ts'] = ts

    post_data['from'] = ''

    post_data['ppp'] = ''

    post_data['chg'] = 0

    post_data['loginentry'] = 3

    post_data['s'] = ''

    post_data['dmtype'] = 'bizmail'

    post_data['fun'] = ''

    post_data['inputuin'] = email

    post_data['verifycode'] = ''


    headers = {'Content-Type': 'application/x-www-form-urlencoded'}

    url = 'https://exmail.qq.com/cgi-bin/login'

    resp = session.post(url, headers=headers, data=post_data)


    regexp = r'sid=(.*?)"'


    sid = re.findall(regexp, resp.content)[0]

    url = 'http://exmail.qq.com/cgi-bin/laddr_biz?action=show_party_list&sid={sid}&t=contact&view=biz'

    resp = session.get(url.format(sid=sid))


    text = resp.text

    regexp = r'{id:"(\S*?)", pid:"(\S*?)", name:"(\S*?)", order:"(\S*?)"}'

    results = re.findall(regexp, text)

    department_ids = []

    department_infor = dict()

    root_department = None

    for item in results:

        department_ids.append(item[0])

        department = dict(id=item[0], pid=item[1], name=item[2], order=item[3])

        department_infor[item[0]] = department

        if item[1] == 0 or item[1] == '0':

            root_department = department


    regexp = r'{uin:"(\S*?)",pid:"(\S*?)",name:"(\S*?)",alias:"(\S*?)",sex:"(\S*?)",pos:"(\S*?)",tel:"(\S*?)",birth:"(\S*?)",slave_alias:"(\S*?)",department:"(\S*?)",mobile:"(\S*?)"}'


    all_emails = []

    staff_infors = []

    for department_id in department_ids:

        url = 'http://exmail.qq.com/cgi-bin/laddr_biz?t=memtree&limit={limit}&partyid={partyid}&action=show_party&sid={sid}'

        resp = session.get(

            url.format(limit=limit, sid=sid, partyid=department_id))

        text = resp.text

        results = re.findall(regexp, text)


        for item in results:

            all_emails.append(item[3])

            print item[3]

            staff = dict(uin=item[0], pid=item[1], name=item[2], alias=item[3], sex=item[4], pos=item[

                         5], tel=item[6], birth=item[7], slave_alias=item[8], department=item[9], mobile=item[10])

            staff_infors.append(staff)


    with open(emailfile, 'w') as f:

        for item in all_emails:

            f.write(item + '\n')


    with open(departfile, 'w') as f:

        print_tree(root_department['id'], department_infor, 0, staff_infors, f)


    print("total email count: %i" % len(all_emails))

    print("total department count: %i" % len(department_ids))






还可以用这个。

http://www.ttlsa.com/python/fetch-mailaddress-and-corporate-schema-structure/


评论

© Sh4dow's Blog | Powered by LOFTER