Spaces:
Build error
Build error
| # copyright (c) 2020 PaddlePaddle Authors. All Rights Reserve. | |
| # | |
| # Licensed under the Apache License, Version 2.0 (the "License"); | |
| # you may not use this file except in compliance with the License. | |
| # You may obtain a copy of the License at | |
| # | |
| # http://www.apache.org/licenses/LICENSE-2.0 | |
| # | |
| # Unless required by applicable law or agreed to in writing, software | |
| # distributed under the License is distributed on an "AS IS" BASIS, | |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | |
| # See the License for the specific language governing permissions and | |
| # limitations under the License. | |
| import os | |
| import argparse | |
| import json | |
| def gen_rec_label(input_path, out_label): | |
| with open(out_label, 'w') as out_file: | |
| with open(input_path, 'r') as f: | |
| for line in f.readlines(): | |
| tmp = line.strip('\n').replace(" ", "").split(',') | |
| img_path, label = tmp[0], tmp[1] | |
| label = label.replace("\"", "") | |
| out_file.write(img_path + '\t' + label + '\n') | |
| def gen_det_label(root_path, input_dir, out_label): | |
| with open(out_label, 'w') as out_file: | |
| for label_file in os.listdir(input_dir): | |
| img_path = root_path + label_file[3:-4] + ".jpg" | |
| label = [] | |
| with open( | |
| os.path.join(input_dir, label_file), 'r', | |
| encoding='utf-8-sig') as f: | |
| for line in f.readlines(): | |
| tmp = line.strip("\n\r").replace("\xef\xbb\xbf", | |
| "").split(',') | |
| points = tmp[:8] | |
| s = [] | |
| for i in range(0, len(points), 2): | |
| b = points[i:i + 2] | |
| b = [int(t) for t in b] | |
| s.append(b) | |
| result = {"transcription": tmp[8], "points": s} | |
| label.append(result) | |
| out_file.write(img_path + '\t' + json.dumps( | |
| label, ensure_ascii=False) + '\n') | |
| if __name__ == "__main__": | |
| parser = argparse.ArgumentParser() | |
| parser.add_argument( | |
| '--mode', | |
| type=str, | |
| default="rec", | |
| help='Generate rec_label or det_label, can be set rec or det') | |
| parser.add_argument( | |
| '--root_path', | |
| type=str, | |
| default=".", | |
| help='The root directory of images.Only takes effect when mode=det ') | |
| parser.add_argument( | |
| '--input_path', | |
| type=str, | |
| default=".", | |
| help='Input_label or input path to be converted') | |
| parser.add_argument( | |
| '--output_label', | |
| type=str, | |
| default="out_label.txt", | |
| help='Output file name') | |
| args = parser.parse_args() | |
| if args.mode == "rec": | |
| print("Generate rec label") | |
| gen_rec_label(args.input_path, args.output_label) | |
| elif args.mode == "det": | |
| gen_det_label(args.root_path, args.input_path, args.output_label) | |