Python 源码：通过词法分析模块 tokenize 提取注释，并用正则表达式匹配测试用例的作者名
提取代码如下
"""Extract test-case author names from the comments of a Python source file."""
import re
import tokenize

# Captures everything that follows "Author:" up to the end of the comment.
AUTHOR_PATTERN = re.compile(r'Author:(.+)')


def _iter_authors(path):
    """Yield each author name found in the comments of the file at *path*.

    Only COMMENT tokens are inspected, so "Author:" text inside string
    literals or docstrings is ignored. Names are yielded in source order,
    one per matching comment, with every space character removed.
    """
    with tokenize.open(path) as source:
        for token in tokenize.generate_tokens(source.readline):
            if token.type != tokenize.COMMENT:
                continue
            match = AUTHOR_PATTERN.search(token.string)
            if match:
                # Drop spaces so "Author: name" and "Author:name" agree.
                yield match.group(1).replace(" ", "")


def extract_authors(path='readcomment.py'):
    """Return the list of author names declared in ``# Author:`` comments.

    Args:
        path: Python source file to scan. Defaults to ``readcomment.py``,
            the file the original script read.

    Returns:
        A list of author names in the order their comments appear; empty
        when no comment matches.

    Raises:
        OSError: If *path* cannot be opened. Errors raised by the tokenizer
            on malformed source propagate unchanged.
    """
    return list(_iter_authors(path))


if __name__ == '__main__':
    # Print each name as soon as it is found, then the collected list,
    # matching the output of the original script.
    authors = []
    for author in _iter_authors('readcomment.py'):
        print(author)
        authors.append(author)
    print(authors)
例如，待解析的源码（readcomment.py）如下
def say_hello():  # Author:吴彦祖
    """Print a fixed greeting to standard output.

    This function is sample input for the comment extractor: the trailing
    ``# Author:`` comments are what the extractor reads, while this
    docstring is a string token and is therefore ignored by it.
    """
    print("Hello, World!")  # Author: 刘亦菲


if __name__ == '__main__':  # this is main
    say_hello()
执行结果
吴彦祖
刘亦菲
['吴彦祖', '刘亦菲']
浙公网安备 33010602011771号