run.py 556 B

12345678910111213141516
  1. from tools import documents_extractor
  2. from transcript_extractor import rectify_transcript
# Hard-coded absolute Windows path to the PDF used as input for the run at the
# bottom of this script (located under the transcript_extractor "test" folder).
transcript = "E:\\project\\arbitration_system\\transcript_extractor\\test\\庭审笔录.PDF"
  4. def transcript_extractor_run(transcript):
  5. reader = documents_extractor.DocumentReader()
  6. result_reader = reader.process_input(transcript)
  7. print(result_reader)
  8. rectify_client = rectify_transcript.RectifyClient_transcript()
  9. result_rectify = rectify_client.clean_text(result_reader)
  10. return result_rectify
# Script entry: run the extraction on the hard-coded path and print the result.
# NOTE(review): there is no ``if __name__ == "__main__"`` guard, so this also
# executes whenever the module is imported.
print(transcript_extractor_run(transcript))