# yuketangHelperBUU/homework_Helpers.py at main · MuWinds/yuketangHelperBUU · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
# -*- coding: utf-8 -*-
# version:5.0
# developed by zk chen and MR.Li
# V3版本仅能刷项目管理概论作业题
# V4版本由李同学改良，可以刷用户名下所有的课程的线上作业
# V5版本旨在跨学院使用，在微电子学院网课中发现了填空题类型，因此兼容了填空题，另外增加了交互，可以选择想刷哪个课程
import hashlib
import requests
from fontTools.ttLib import TTFont
from html import unescape
import re
import json
from io import BytesIO
import get_info

# Session bootstrap: ask for the Yuketang host, then obtain the login cookies
# and the university id for that host through the get_info helper module.
domain = input('输入雨课堂域名：(BUU输入buu.yuketang.cn)')
cookies = get_info.getCookies(domain)
csrftoken, sessionid = get_info.extract_specific_cookies(cookies)
# Stored as text because it is concatenated into URLs and header values below.
university_id = str(get_info.getUniversityId(domain))

# Original author's notes: questions that are already finished are skipped, so
# re-running the script after an incomplete pass is safe; automatic answering
# is possible only because the web API returns the homework answers.
#
# Headers sent with every API request made by this script.
headers = {
    'User-Agent': 'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_4) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/87.0.4280.67 Safari/537.36',
    'Content-Type': 'application/json',
    'Cookie': ''.join((
        'csrftoken=', csrftoken,
        '; sessionid=', sessionid,
        '; university_id=', university_id,
        '; platform_id=3',
    )),
    'x-csrftoken': csrftoken,
    'sec-fetch-dest': 'empty',
    'sec-fetch-mode': 'cors',
    'sec-fetch-site': 'same-origin',
    'university-id': university_id,
    'xtbz': 'cloud'
}

# Numeric `leaf_type` codes used in the course-chapter API response, keyed by
# the kind of course item they denote.
leaf_type = dict(
    video=0,
    homework=6,
    exam=5,
    recommend=3,
    discussion=4,
)

# `cache` memoises the glyph tables built by gen_table, keyed by font URL
# (each value maps a code point to the MD5 of that glyph's outline).
# `source_table` is the reference table loaded from SourceTable.json; it is
# looked up by glyph MD5 and yields the code point of the real character.
cache = dict()
with open('SourceTable.json', mode='r', encoding='utf-8') as f:
    source_table = json.loads(f.read())


def gen_table(ttf):
    """Download the font at ``ttf`` and cache an MD5 fingerprint per glyph.

    For every code point in ``range(19968, 40870)`` that the font maps, the
    glyph outline is serialised and hashed.  The resulting
    ``{code point: md5 hex digest}`` dict is stored in ``cache[ttf]``.

    Args:
        ttf: URL of the font file to download.

    Returns:
        None.  The table is published through the module-level ``cache``.

    Raises:
        requests.RequestException: if the download fails, times out, or the
            server answers with an HTTP error status.
    """
    # A timeout keeps a stalled font download from hanging the script, and the
    # status check stops an HTML error page from being parsed as a font.
    res = requests.get(ttf, headers=headers, timeout=30)
    res.raise_for_status()
    font = TTFont(BytesIO(res.content))

    glyf_table = font['glyf']  # looked up once instead of once per glyph
    table = {}
    for code, glyph_name in font.getBestCmap().items():
        if not 19968 <= code < 40870:
            continue
        glyph = glyf_table[glyph_name]

        # Serialise the outline.  The exact text format below must not change:
        # the digests are compared against the keys of SourceTable.json.
        # NOTE(review): iterating ``glyph.coordinates`` appears to yield single
        # points rather than whole contours; the "contour:" label is kept as-is
        # so the fingerprints stay compatible - confirm against the table.
        path = []
        if glyph.isComposite():
            for comp in glyph.components:
                path.append(f"component:{comp.glyphName}")
        elif glyph.numberOfContours > 0:
            for contour in glyph.coordinates:
                path.append(f"contour:{list(contour)}")

        # Glyphs with no outline data get no entry.
        if path:
            path_str = json.dumps(path)
            table[code] = hashlib.md5(path_str.encode()).hexdigest()
    cache[ttf] = table


def get_encrypt_string(s, ttf):
    """Decode the font-obfuscated text inside a JSON document.

    Every string value in the parsed document is scanned for
    ``<span class="xuetangx-com-encrypted-font">...</span>`` fragments.  Each
    character inside such a span is looked up in the glyph table of ``ttf``
    (code point -> glyph MD5) and then in ``source_table`` (glyph MD5 -> real
    code point); characters without a mapping are kept unchanged.  The span,
    including its tags, is replaced by the decoded text and the value is then
    normalised with ``format_string``.

    The substitution is done on the *decoded* string values, not on the raw
    JSON text: in the raw text the attribute quotes are escaped (``\\"``), so
    a plain ``str.replace`` on it never finds the span.  Normalising value by
    value also keeps the result parseable, because quote characters produced
    by ``format_string`` are re-escaped on serialisation.

    Args:
        s: JSON text to process.
        ttf: URL of the obfuscation font; its glyph table is built on first
            use via ``gen_table`` and reused from ``cache`` afterwards.

    Returns:
        The processed document serialised back to JSON text.

    Raises:
        json.JSONDecodeError: if ``s`` is not valid JSON.
    """
    if ttf not in cache:
        gen_table(ttf)
    glyph_table = cache[ttf]

    span_pattern = re.compile(
        r'<span class="xuetangx-com-encrypted-font">(.*?)</span>')

    def decode_span(match):
        # Map each obfuscated character back to the real one where possible.
        decoded = []
        for char in match.group(1):
            md5 = glyph_table.get(ord(char))
            if md5 in source_table:
                decoded.append(chr(source_table[md5]))
            else:
                decoded.append(char)
        return ''.join(decoded)

    def decode(obj):
        # Rebuild the structure, transforming only string values.
        if isinstance(obj, dict):
            return {key: decode(value) for key, value in obj.items()}
        if isinstance(obj, list):
            return [decode(item) for item in obj]
        if isinstance(obj, str):
            return format_string(span_pattern.sub(decode_span, obj))
        return obj

    # ensure_ascii=False keeps the decoded CJK text readable in the output.
    return json.dumps(decode(json.loads(s)), ensure_ascii=False)


def format_string(s):
    """Return ``s`` normalised for comparison.

    Steps, in order: decode HTML entities; map full-width characters
    (U+FF01..U+FF5E) to their half-width ASCII counterparts and curly quotes /
    the ideographic full stop to plain ASCII punctuation; collapse every run
    of whitespace to one space and trim both ends; finally drop a single
    trailing ``, . ? : ! ;`` if present.
    """
    # One translation table covers both character-level substitutions.  The
    # two sets of source characters are disjoint and no output of one is an
    # input of the other, so a single pass gives the same result as applying
    # them one after another.
    char_map = {code: code - 65248 for code in range(0xFF01, 0xFF5E + 1)}
    char_map.update({
        ord('“'): '"', ord('”'): '"',
        ord('‘'): "'", ord('’'): "'",
        ord('。'): '.',
    })
    normalised = unescape(s).translate(char_map)

    collapsed = re.sub(r'\s+', ' ', normalised).strip()
    return re.sub(r'[,.?:!;]$', '', collapsed)


def _collect_homework_ids(course_chapters):
    """Return the ids of all homework leaves found in ``course_chapters``.

    A section either carries a nested ``leaf_list`` or is itself a leaf; both
    shapes are checked against ``leaf_type["homework"]``.
    """
    homework_ids = []
    for chapter in course_chapters:
        for section in chapter["section_leaf_list"]:
            if "leaf_list" in section:
                for leaf in section["leaf_list"]:
                    if leaf['leaf_type'] == leaf_type["homework"]:
                        print(leaf['name'], leaf['leaf_type'],
                              leaf_type["homework"], leaf['id'])
                        homework_ids.append(leaf["id"])
            elif section['leaf_type'] == leaf_type["homework"]:
                homework_ids.append(section["id"])
    return homework_ids


def do_homework(submit_url, classroom_id, course_sign, course_name):
    """Fetch and decode every homework exercise list of one course.

    Lists the course chapters, collects the homework leaves, and for each one
    resolves its ``leaf_type_id``, downloads the exercise list and decodes the
    font-obfuscated text in it via ``get_encrypt_string``.

    Args:
        submit_url: answer-submission endpoint.  Currently unused because the
            submission step is not implemented (see the TODO at the end).
        classroom_id: id of the classroom whose chapters are listed.
        course_sign: course signature passed as the ``sign`` query parameter.
        course_name: display name, used only in the progress message.

    Raises:
        Exception: if the chapter listing does not have the expected shape.
        requests.RequestException: if an HTTP request fails or times out.
    """
    # Step 1: list the chapters and pick out the homework leaves.
    get_homework_ids = "https://"+domain+"/mooc-api/v1/lms/learn/course/chapter?cid=" + \
        str(classroom_id)+"&term=latest&uv_id=" + \
        university_id+"&sign="+course_sign
    homework_ids_response = requests.get(
        url=get_homework_ids, headers=headers, timeout=30)
    print(homework_ids_response.text)
    homework_json = json.loads(homework_ids_response.text)
    try:
        homework_ids = _collect_homework_ids(
            homework_json["data"]["course_chapter"])
        print(f"{course_name}共有{len(homework_ids)}个作业喔！")
    except (KeyError, TypeError) as err:
        # Only shape errors are translated; Ctrl-C and the like pass through.
        print("fail while getting homework_ids!!! please re-run this program!")
        raise Exception(
            "fail while getting homework_ids!!! please re-run this program!") from err

    # Step 2: resolve each homework leaf and fetch its exercise list.
    for homework in homework_ids:
        # uv_id uses the configured university like every other request,
        # instead of a hard-coded university id.
        get_leaf_type_id_url = "https://"+domain+"/mooc-api/v1/lms/learn/leaf_info/" + \
            str(classroom_id)+"/"+str(homework)+"/?term=latest&uv_id="+university_id
        leaf_response = requests.get(
            url=get_leaf_type_id_url, headers=headers, timeout=30)
        try:
            leaf_id = json.loads(leaf_response.text)[
                "data"]["content_info"]["leaf_type_id"]
        except (ValueError, KeyError, TypeError):
            # Best effort: skip leaves whose info cannot be read.
            continue
        problem_url = "https://"+domain+"/mooc-api/v1/lms/exercise/get_exercise_list/" + \
            str(leaf_id)+"/?term=latest&uv_id="+university_id
        id_response = requests.get(
            url=problem_url, headers=headers, timeout=30)
        dictionary = json.loads(id_response.text)
        font_ttf = dictionary['data']['font']
        decrypted_str = get_encrypt_string(id_response.text, font_ttf)
        dictionary = json.loads(decrypted_str)
        # TODO: submitting answers is not implemented.  The earlier draft
        # posted json.dumps(submit_json_data) to submit_url and, when the
        # response contained "Expected available in <n> second.", slept for
        # n + 0.5 seconds before retrying; `dictionary` holds the decoded
        # exercise list that step would consume.


if __name__ == "__main__":
    # Interactive entry point: list the user's courses, ask which one to
    # process, then run do_homework for the selection.
    your_courses = []

    # first, need to get classroom_id
    get_classroom_id = "https://"+domain + \
        "/mooc-api/v1/lms/user/user-courses/?status=1&page=1&no_page=1&term=latest&uv_id=" + \
        university_id + ""
    submit_url = "https://"+domain + \
        "/mooc-api/v1/lms/exercise/problem_apply/?term=latest&uv_id="+university_id+""
    classroom_id_response = requests.get(
        url=get_classroom_id, headers=headers, timeout=30)
    try:
        for ins in json.loads(classroom_id_response.text)["data"]["product_list"]:
            your_courses.append({
                "course_name": ins["course_name"],
                "classroom_id": ins["classroom_id"],
                "course_sign": ins["course_sign"],
                "sku_id": ins["sku_id"],
                "course_id": ins["course_id"]
            })
    except Exception as e:
        print("fail while getting classroom_id!!! please re-run this program!")
        # Keep the original failure attached for diagnosis.
        raise Exception(
            "fail while getting classroom_id!!! please re-run this program!") from e

    for index, value in enumerate(your_courses, start=1):
        print("编号："+str(index)+" 课名："+str(value["course_name"]))
    number = input("你想刷哪门课呢?请输入编号。输入0表示全部课程都刷一遍\n")

    # Validate the choice up front: a non-numeric answer used to crash with a
    # bare ValueError, and a negative one silently indexed from the end of the
    # course list.
    try:
        choice = int(number)
    except ValueError:
        raise SystemExit(
            f"无效的编号：{number!r}，请输入 0 到 {len(your_courses)} 之间的整数") from None
    if not 0 <= choice <= len(your_courses):
        raise SystemExit(
            f"无效的编号：{choice}，请输入 0 到 {len(your_courses)} 之间的整数")

    # 0 selects every course; any other number is a 1-based course index.
    selected = your_courses if choice == 0 else [your_courses[choice - 1]]
    for ins in selected:
        do_homework(submit_url, ins["classroom_id"],
                    ins["course_sign"], ins["course_name"])