将系统中的字体保存为图片,为 OCR 提供训练数据
一、字体库存储路径
Win10 系统字库文件所在的目录为 C:\Windows\Fonts\
![](https://img.laitimes.com/img/_0nNw4CM6IyYiwiM6ICdiwiIwczX0xiRGZkRGZ0Xy9GbvNGL2EzXlpXazxSPrRlT5lFRPBTRywEMW1mY1RzRapnTtxkb5ckYplTeMZTTINGMShUYfRHelRHLwEzX39GZhh2css2RkBnVHFmb1clWvB3MaVnRtp1XlBXe0xyayFWbyVGdhd3LcV2Zh1Wa9M3clN2byBXLzN3btg3Pn5GcukTM1MzMxcTM0EDMxAjMwIzLc52YucWbp5GZzNmLn9Gbi1yZtl2Lc9CX6MHc0RHaiojIsJye.png)
二、字体库提取保存代码
代码中选择的字体库是 Microsoft YaHei(微软雅黑),提取并保存字库的代码如下:
#encoding: utf-8
import os
import pygame
# Render every character in a code-point range to its own PNG file, using
# the Microsoft YaHei font file installed under the Windows font directory.

# Directory the rendered glyph images are written to.
chinese_dir = 'chinese/'
# exist_ok=True replaces the separate exists() check followed by mkdir().
os.makedirs(chinese_dir, exist_ok=True)

pygame.init()

# First and last code points to render, both inclusive (U+4E00..U+9FA5).
start, end = (0x4E00, 0x9FA5)

# The font does not change between characters, so load it once up front
# instead of once per iteration. A raw string keeps the backslashes in the
# Windows path literal without relying on unrecognised escape sequences.
# (pygame.font.SysFont('Microsoft YaHei', 64) is the name-based alternative.)
font = pygame.font.Font(r"c:\Windows\Fonts\msyh.ttc", 64)

# range() excludes its stop value, so add 1 to include the `end` code point.
for codepoint in range(start, end + 1):
    word = chr(codepoint)  # character for this code point
    print(word)
    # Antialiased black glyph on a white background.
    ftext = font.render(word, True, (0, 0, 0), (255, 255, 255))
    # Output file is named after the decimal code point, e.g. "19968.png".
    pygame.image.save(ftext, chinese_dir + str(codepoint) + ".png")