You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

83 lines
2.7 KiB

  1. import sys
  2. import dill
  3. dill.load_session('voilastate.db')
  4. inpu = sys.argv[1]
  5. try:
  6. outsentences, punctuations = oi.CellInputText2SplitsentencesWithspacy(inpu)
  7. except:
  8. out = 'Bitte auf die Zeichensetzung achten! '
  9. print(out)
  10. exit()
  11. outsentences = sy.replaceOpposites(outsentences)
  12. insentences = outsentences
  13. outsentences, punctuations = sent_seg.putAppendixesIntoOwnSentences(insentences, punctuations)
  14. insentences = outsentences
  15. sentsegformattedsentences = []
  16. for sentence in insentences:
  17. sentsegformattedsentences.append([sentence])
  18. #print(sentsegformattedsentences)
  19. sentences = sent_seg.CommaSentenceOrNot(sentsegformattedsentences)
  20. #print(sentences)
  21. sentences = sent_seg.GetUtteranceNumber(sentences)
  22. #print(sentences)
  23. sentences = sent_seg.GetQuestionOrNot(sentences)
  24. #print(sentences)
  25. sentences, punctuations = sent_seg.AndOrSolver(sentences, punctuations)
  26. #print(len(punctuations))
  27. #print('sentences after AndOrSolver', sentences, punctuations)
  28. sentences = sent_seg.CommaSentenceOrNot(sentences)
  29. #print(sentences)
  30. sentences = sent_seg.GetUtteranceNumber(sentences)
  31. #print(sentences)
  32. sentences = sent_seg.GetQuestionOrNot(sentences)
  33. #print(sentences)
  34. sentences, punctuations = sent_seg.SplitSentencesIntoHauptNebenTuple(sentences, punctuations)
  35. #print(len(punctuations))
  36. #print('sentences after split haupt neben', sentences)
  37. sentences = sent_seg.CommaSentenceOrNot(sentences)
  38. #print(sentences)
  39. sentences = sent_seg.GetUtteranceNumber(sentences)
  40. #print(sentences)
  41. sentences = sent_seg.GetQuestionOrNot(sentences)
  42. #print(sentences)
  43. outsentences, punctuations = sent_seg.SplitCommatas(sentences, punctuations)
  44. insentences = outsentences
  45. outsentences = solSh.ExplainShortsInSentencesWithBrackets(insentences)
  46. insentences = outsentences
  47. outsentences = p2a.replacePassivForms(insentences)
  48. insentences = outsentences
  49. outsentences = gs.ReplaceGenitivWithDativ(insentences)
  50. insentences = []
  51. for sentence in outsentences:
  52. insentences.append([word.replace('ö','oe').replace('ü','ue').replace('ä','ae').replace('ß','ss') for word in sentence])
  53. outsentences = cs.replaceConjunctives(insentences)
  54. insentences = outsentences
  55. outsentences, punctuations = fwb.fremdEintragAppend(insentences, punctuations)
  56. insentences = outsentences
  57. outsentences, punctuations = medi.Medioreplace(insentences, punctuations)
  58. out = ''
  59. #print('just before looking if the lenght is the same')
  60. #print(len(outsentences), len(punctuations))
  61. if len(outsentences) == len(punctuations):
  62. #print('the length is the same')
  63. for n in range(len(outsentences)):
  64. outsentence = outsentences[n]
  65. outsentence[0] = outsentence[0].title()
  66. out += ' '.join(outsentence) + punctuations[n] + '\n'
  67. print(out)