Python 在 txt 文件中随机抽取样本

import random
def sample_lines(src_path, dst_path, k=500):
    """Append up to *k* randomly chosen lines of *src_path* to *dst_path*.

    Lines are drawn without replacement using ``random.sample``. If the
    source file holds fewer than *k* lines, every line is written (in random
    order) instead of raising ``ValueError``.

    Args:
        src_path: Path of the UTF-8 text file to sample from.
        dst_path: Path of the UTF-8 text file the sample is appended to
            (opened in append mode, so existing content is preserved).
        k: Maximum number of lines to draw.

    Returns:
        The number of lines actually written.

    Raises:
        OSError: If either file cannot be opened.
        ValueError: If *k* is negative.
    """
    with open(src_path, 'r', encoding='utf-8') as src:
        lines = src.readlines()

    # Clamp the sample size so a short source file does not make
    # random.sample() fail with "sample larger than population".
    picked = random.sample(lines, min(k, len(lines)))

    with open(dst_path, 'a', encoding='utf-8') as dst:
        # The last line of the source may lack a trailing newline; add one so
        # it cannot be glued to whichever line is written after it.
        dst.writelines(
            line if line.endswith('\n') else line + '\n' for line in picked
        )

    # Both files are already closed here by their `with` blocks.
    return len(picked)


if __name__ == '__main__':
    # Draw 500 random training lines and append them to the dev split, then
    # report how many lines were actually written.
    print(sample_lines('./data/trec/train.txt', './data/trec/dev.txt', 500))
发布了50 篇原创文章 · 获赞 44 · 访问量 8896

猜你喜欢

转载自blog.csdn.net/tailonh/article/details/105525742