Open Chinese Convert
0.4.3
A project for conversion between Traditional and Simplified Chinese
|
#coding: utf-8
# Helpers for tab-separated dictionary files: every non-blank line has the
# form "key<TAB>value".  reverse_items and find_target_items additionally
# treat the value as a list of entries separated by single spaces.

import io
import sys


def _split_entry(line):
    """Split one raw dictionary line into a ``(key, value)`` pair.

    Trailing carriage returns / newlines are removed from the value.

    Returns:
        ``None`` when the line holds nothing but line-ending characters,
        otherwise the ``(key, value)`` tuple.

    Raises:
        ValueError: if the line does not contain exactly one tab.
    """
    # Lines read from a file keep their newline, so a blank line is "\n",
    # never "" -- test the content with the line ending stripped.
    if not line.strip("\r\n"):
        return None
    key, value = line.split("\t")
    # rstrip is safe on an empty value, where indexing value[-1] is not.
    return key, value.rstrip("\r\n")


def sort_items(input_filename, output_filename, encoding="utf-8"):
    """Rewrite a dictionary file with its entries sorted by key.

    The input is read completely and closed before the output is opened.
    When a key occurs more than once, the last occurrence wins.  Blank
    lines are skipped.  A line without exactly one tab is printed to
    standard output and skipped.

    Args:
        input_filename: path of the file to read.
        output_filename: path of the file to write.
        encoding: text encoding used for both files.  UTF-8 is an
            assumption about the data files -- TODO confirm.
    """
    entries = {}
    # io.open accepts ``encoding`` on Python 3 and on Python 2.6+.
    with io.open(input_filename, "r", encoding=encoding) as input_file:
        for line in input_file:
            try:
                entry = _split_entry(line)
            except ValueError:
                # Report the malformed line, then skip it so that no
                # stale key/value from an earlier line gets stored.
                print(line)
                continue
            if entry is None:
                continue
            key, value = entry
            entries[key] = value

    with io.open(output_filename, "w", encoding=encoding) as output_file:
        for key in sorted(entries):
            output_file.write(key + "\t" + entries[key] + "\n")


def reverse_items(input_filename, output_filename, encoding="utf-8"):
    """Write the inverse mapping of a dictionary file.

    Each value is split on single spaces; every resulting entry becomes a
    key of the output, mapped to the space-joined list of input keys it
    appeared under (in input order).  Output lines are sorted by key.
    Blank lines are skipped.

    Args:
        input_filename: path of the file to read.
        output_filename: path of the file to write.
        encoding: text encoding used for both files.  UTF-8 is an
            assumption about the data files -- TODO confirm.

    Raises:
        ValueError: if a non-blank line does not contain exactly one tab.
    """
    reversed_entries = {}
    with io.open(input_filename, "r", encoding=encoding) as input_file:
        for line in input_file:
            entry = _split_entry(line)
            if entry is None:
                continue
            key, value = entry
            for item in value.split(" "):
                reversed_entries.setdefault(item, []).append(key)

    with io.open(output_filename, "w", encoding=encoding) as output_file:
        for item in sorted(reversed_entries):
            output_file.write(
                item + "\t" + " ".join(reversed_entries[item]) + "\n")


def find_target_items(input_filename, keyword, encoding="utf-8"):
    """Print the lines whose value entries contain ``keyword``.

    Each value is split on single spaces and the raw line is written to
    standard output once for every entry that contains ``keyword`` as a
    substring, so a line with several matching entries appears several
    times.  Blank lines are skipped.

    Args:
        input_filename: path of the file to search.
        keyword: substring to look for; a byte string is decoded with
            ``encoding`` first.
        encoding: text encoding of the file.  UTF-8 is an assumption
            about the data files -- TODO confirm.

    Raises:
        ValueError: if a non-blank line does not contain exactly one tab.
    """
    # The file is read as text, so a byte-string keyword must be decoded
    # before it can be compared against the decoded lines.
    if isinstance(keyword, bytes):
        keyword = keyword.decode(encoding)

    with io.open(input_filename, "r", encoding=encoding) as input_file:
        for line in input_file:
            entry = _split_entry(line)
            if entry is None:
                continue
            for item in entry[1].split(" "):
                if keyword in item:
                    # The line still carries its own line ending.
                    sys.stdout.write(line)