info_generate.py 7.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102
  1. import random
  2. import zhconv
  3. from tqdm import tqdm
  4. from zhconv import convert
  5. def random_name():
  6. # 删减部分小众姓氏
  7. # firstName = "赵钱孙李周吴郑王冯陈褚卫蒋沈韩杨朱秦尤许何吕施张孔曹严华金魏陶姜戚谢邹喻水云苏潘葛奚范彭郎鲁韦昌马苗凤花方俞任袁柳鲍史唐费岑薛雷贺倪汤滕殷罗毕郝邬安常乐于时傅卞齐康伍余元卜顾孟平" \
  8. # "黄和穆萧尹姚邵湛汪祁毛禹狄米贝明臧计成戴宋茅庞熊纪舒屈项祝董粱杜阮席季麻强贾路娄危江童颜郭梅盛林刁钟徐邱骆高夏蔡田胡凌霍万柯卢莫房缪干解应宗丁宣邓郁单杭洪包诸左石崔吉" \
  9. # "龚程邢滑裴陆荣翁荀羊甄家封芮储靳邴松井富乌焦巴弓牧隗山谷车侯伊宁仇祖武符刘景詹束龙叶幸司韶黎乔苍双闻莘劳逄姬冉宰桂牛寿通边燕冀尚农温庄晏瞿茹习鱼容向古戈终居衡步都耿满弘国文东殴沃曾关红游盖益桓公晋楚闫"
  10. # 百家姓姓氏
  11. firstName = "赵钱孙李周吴郑王冯陈褚卫蒋沈韩杨朱秦尤许何吕施张孔曹严华金魏陶姜戚谢邹喻柏水窦章云苏潘葛奚范彭郎鲁韦昌马苗凤花方俞任袁柳酆鲍史唐费廉岑薛雷贺倪汤滕殷罗毕郝邬安常乐于时傅皮卞齐康伍余元卜顾孟平" \
  12. "黄和穆萧尹姚邵湛汪祁毛禹狄米贝明臧计伏成戴谈宋茅庞熊纪舒屈项祝董粱杜阮蓝闵席季麻强贾路娄危江童颜郭梅盛林刁钟徐邱骆高夏蔡田樊胡凌霍虞万支柯昝管卢莫经房裘缪干解应宗丁宣贲邓郁单杭洪包诸左石崔吉钮" \
  13. "龚程嵇邢滑裴陆荣翁荀羊於惠甄麴家封芮羿储靳汲邴糜松井段富巫乌焦巴弓牧隗山谷车侯宓蓬全郗班仰秋仲伊宫宁仇栾暴甘钭厉戎祖武符刘景詹束龙叶幸司韶郜黎蓟薄印宿白怀蒲邰从鄂索咸籍赖卓蔺屠蒙池乔阴欎胥能苍" \
  14. "双闻莘党翟谭贡劳逄姬申扶堵冉宰郦雍舄璩桑桂濮牛寿通边扈燕冀郏浦尚农温别庄晏柴瞿阎充慕连茹习宦艾鱼容向古易慎戈廖庾终暨居衡步都耿满弘匡国文寇广禄阙东殴殳沃利蔚越夔隆师巩厍聂晁勾敖融冷訾辛阚那简饶空" \
  15. "曾毋沙乜养鞠须丰巢关蒯相查後荆红游竺权逯盖益桓公晋楚闫法汝鄢涂钦归海帅缑亢况后有琴梁丘左丘商牟佘佴伯赏南宫墨哈谯笪年爱阳佟言福百家姓终"
  16. # 百家姓中双姓氏
  17. firstName2 = "万俟司马上官欧阳夏侯诸葛闻人东方赫连皇甫尉迟公羊澹台公冶宗政濮阳淳于单于太叔申屠公孙仲孙轩辕令狐钟离宇文长孙慕容鲜于闾丘司徒司空亓官司寇仉督子颛孙端木巫马公西漆雕乐正壤驷公良拓跋夹谷宰父谷梁段干百里东郭南门呼延羊舌微生梁丘左丘东门西门南宫南宫"
  18. # # 女孩名字
  19. # girl = '秀娟英华慧巧美娜静淑惠珠翠雅芝玉萍红娥玲芬芳燕彩春菊兰凤洁梅琳素云莲真环雪荣爱妹霞香月莺媛艳瑞凡佳嘉琼勤珍贞莉桂娣叶璧璐娅琦晶妍茜秋珊莎锦黛青倩婷姣婉娴瑾颖露瑶怡婵雁蓓纨仪荷丹蓉眉君琴蕊薇菁梦岚苑婕馨瑗琰韵融园艺咏卿聪澜纯毓悦昭冰爽琬茗羽希宁欣飘育滢馥筠柔竹霭凝晓欢霄枫芸菲寒伊亚宜可姬舒影荔枝思丽'
  20. # # 男孩名字
  21. # boy = '伟刚勇毅俊峰强军平保东文辉力明永健世广志义兴良海山仁波宁贵福生龙元全国胜学祥才发武新利清飞彬富顺信子杰涛昌成康星光天达安岩中茂进林有坚和彪博诚先敬震振壮会思群豪心邦承乐绍功松善厚庆磊民友裕河哲江超浩亮政谦亨奇固之轮翰朗伯宏言若鸣朋斌梁栋维启克伦翔旭鹏泽晨辰士以建家致树炎德行时泰盛雄琛钧冠策腾楠榕风航弘'
  22. # # 名
  23. # name = '中笑贝凯歌易仁器义礼智信友上都卡被好无九加电金马钰玉忠孝'
  24. fp = open('materials/chinese_cht_dict.txt', 'r', encoding='utf-8')
  25. name = []
  26. for line in fp.readlines():
  27. name.append(line.rstrip('\n'))
  28. fp.close()
  29. # 地點
  30. addr = ['北市', '新北市', '中市', '桃市', '南市', '彰縣', '屛縣', '竹縣', '苗縣', '南縣', '雲縣', '嘉縣', '宜縣', '花縣', '臺縣', '澎縣', '金縣', '連縣']
  31. # 狀態
  32. state = ['初發', '補發', '換發']
  33. addr_id = random.randint(0, 17)
  34. a = addr[addr_id]
  35. state_id = random.randint(0, 2)
  36. s = state[state_id]
  37. # 10%的机遇生成双数姓氏
  38. if random.choice(range(100)) > 10:
  39. firstName_name = firstName[random.choice(range(len(firstName)))]
  40. else:
  41. i = random.choice(range(len(firstName2)))
  42. firstName_name = firstName2[i:i + 2]
  43. sex = random.choice(range(2))
  44. name_1 = ""
  45. # 生成并返回一个名字
  46. if sex > 0:
  47. name_1 = name[random.randint(0, len(name) - 1)]
  48. if random.choice(range(2)) > 0:
  49. name_1 += name[random.randint(0, len(name) - 1)]
  50. return firstName_name + name_1 + "\t女" +\
  51. '\t' + a + '\t' + s + '\t' + './person_imgs/lisa.png'
  52. else:
  53. name_1 = name[random.randint(0, len(name) - 1)]
  54. if random.choice(range(2)) > 0:
  55. name_1 += name[random.randint(0, len(name) - 1)]
  56. return firstName_name + name_1 + "\t男" + '\t' + a + '\t' + s + '\t' + './person_imgs/02.webp'
  57. fp = open('materials/name_cht.txt', 'w+', encoding='utf-8')
  58. for i in tqdm(range(2000)):
  59. s1 = random_name()
  60. name = s1.split('\t')[0]
  61. temp_str = ''
  62. if len(name) <= 6:
  63. num_of_space = (2 * (6 - len(name))) / (len(name) - 1)
  64. for i in range(0, len(name) - 1):
  65. temp_str += name[i]
  66. for j in range(0, int(num_of_space)):
  67. temp_str += ' '
  68. temp_str += name[len(name) - 1]
  69. name = temp_str
  70. sex = s1.split('\t')[1]
  71. addr = s1.split('\t')[2]
  72. state = s1.split('\t')[3]
  73. img = s1.split('\t')[4]
  74. birth_year = random.randint(0, 100)
  75. birth_month = random.randint(1, 12)
  76. birth_day = random.randint(1, 30)
  77. time_year = random.randint(0, 100)
  78. time_month = random.randint(1, 12)
  79. time_day = random.randint(1, 30)
  80. word_index = random.randint(0, 25)
  81. id = random.randint(0, 1000000000)
  82. # 字母
  83. word = ['A', 'B', 'C', 'D', 'E', 'F', 'G', 'H', 'I', 'J', 'K', 'L', 'M', 'N', 'O', 'P', 'Q', 'R', 'S', 'T', 'U',
  84. 'V', 'W', 'X', 'Y', 'Z']
  85. name = zhconv.convert(name, 'zh-tw')
  86. # print(name)
  87. # line = name + ',' + str(birth_year) + ',' + str(birth_month) + ',' + str(birth_day) + ',民國 ' + str(
  88. # time_year) + ' 年 ' + str(time_month) + ' 月 ' + str(time_day) + ' 日(' + addr + ')' + state + ',' + sex + ',' + word[word_index] + str(id).zfill(9) + ',' + img + '\n'
  89. # br = "民國 " + str(birth_year) + " 年 " + str(birth_month) + ' 月 ' + str(birth_day) + ' 日'
  90. # generate_date = '民國 ' + str(time_year) + ' 年 ' + str(time_month) + ' 月 ' + str(time_day) + ' 日(' + addr + ')' + state
  91. fp.write(name + '\n')