You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

62 lines
1.2 KiB

4 years ago
  # Manual driver script for the SentSeg module.
  #
  # Pushes one document through a fixed sequence of SentSeg methods and prints
  # the intermediate value after each step so the results can be inspected by
  # eye.  Nothing is asserted; the printed output is the only result.
  import SentSeg


  def _show(label, value):
      """Print *value* preceded by *label*, then return *value* unchanged."""
      print(label, value)
      return value


  # NOTE(review): 'de' is presumably a language code (German) -- confirm
  # against the SentSeg constructor.
  sent_seg = SentSeg.SentSeg('de')

  # NOTE(review): 'test2' presumably names the input document -- confirm
  # against ReadDoc2Sent.
  sentences = _show(
      'sentences after ReadDoc2Sent',
      sent_seg.ReadDoc2Sent('test2'),
  )

  # Called once before the steps below; presumably loads resources they rely
  # on -- TODO confirm in SentSeg.  Its return value is not used.
  sent_seg.LoadSentGlueSGDandGSUtils()

  # Each step consumes the previous step's output, so the order matters.
  sentences = _show(
      'sentences after CommaSentenceOrNot',
      sent_seg.CommaSentenceOrNot(sentences),
  )
  sentences = _show(
      'sentences after GetUtteranceNumber',
      sent_seg.GetUtteranceNumber(sentences),
  )
  sentences = _show(
      'sentences after GetQuestionOrNot',
      sent_seg.GetQuestionOrNot(sentences),
  )

  # The split result is kept under its own name; `sentences` stays bound to
  # the output of GetQuestionOrNot.
  sentences1 = _show(
      'sentences after Split into Hauptnebentuple ',
      sent_seg.SplitSentencesIntoHauptNebenTuple(sentences),
  )
  print(sent_seg.SplitCommatas(sentences1))

  # Disabled in the original script and therefore not run here:
  # sent_seg.AndOrSolver, sent_seg.EnumerationSolver and
  # sent_seg.LoadBoWModelAndDatabaseOnesZeros.