mirror of
https://github.com/caperren/school_archives.git
synced 2025-11-09 21:51:15 +00:00
Added work from my other class repositories before deletion
This commit is contained in:
@@ -0,0 +1,29 @@
|
||||
def split_by_periods(document):
    """Split a document into sentences, breaking after every period.

    Newline characters are discarded before splitting, so they never
    appear in the output. Each sentence keeps its terminating period, and
    no other whitespace is trimmed: a space following a period becomes the
    first character of the next sentence.

    Args:
        document: The text to split, as a string.

    Returns:
        A list of strings. Every element except possibly the last ends
        with a period; any non-empty text after the final period is
        returned as the last element. An empty document gives ``[]``.
    """
    # Line breaks are not sentence boundaries here; drop them up front.
    flattened = document.replace("\n", "")

    # str.split removes the separator, so every piece except the last one
    # was followed by a period in the input and gets it put back.
    pieces = flattened.split(".")
    sentences = [piece + "." for piece in pieces[:-1]]

    # Whatever trails the final period is kept only when non-empty.
    trailing = pieces[-1]
    if trailing:
        sentences.append(trailing)

    return sentences
|
||||
|
||||
|
||||
def kwic(document, listPairs=False, ignoreWords=None, periodsToBreaks=False):
    """Break a document into its lines or period-delimited sentences.

    Args:
        document: The text to process. Any falsy value (such as an empty
            string) yields an empty list.
        listPairs: Accepted but not used by this implementation.
        ignoreWords: Accepted but not used by this implementation.
        periodsToBreaks: When true, the document is split after each
            period via ``split_by_periods``; otherwise it is split on
            line boundaries with ``str.splitlines``.

    Returns:
        A list of strings, one per line or sentence.
    """
    # Nothing to split: report no lines at all.
    if not document:
        return []

    if periodsToBreaks:
        return split_by_periods(document)

    return document.splitlines()
|
||||
@@ -0,0 +1,29 @@
|
||||
from kwic import kwic
|
||||
|
||||
# Fixture documents used by the checks below.
empty_document = ""
design_words_doc = "Design is hard.\nLet's just implement."
goodbye_buddy_doc = (
    "Hello there.\n"
    "Hello there, buddy.\n"
    "Hello and goodbye, buddy.\n"
    "Hello is like buddy Goodbye!"
)
hello_buddy_periods = (
    "Hello there. "
    "Hello there, buddy. "
    "Hello and goodbye, buddy. "
    "Hello is like buddy Goodbye!"
)

# Expected result of splitting hello_buddy_periods on periods: each
# sentence keeps its period and the space that followed the previous one.
hello_buddy_periods_output = [
    "Hello there.",
    " Hello there, buddy.",
    " Hello and goodbye, buddy.",
    " Hello is like buddy Goodbye!",
]

if __name__ == "__main__":
    # An empty document produces an empty result.
    assert kwic(empty_document) == []

    # A non-empty document must not produce an empty result.
    assert kwic(design_words_doc) != []

    # A document with one newline is broken into two lines.
    assert len(kwic(design_words_doc)) == 2

    # A document with three newlines is broken into four lines.
    assert len(kwic(goodbye_buddy_doc)) == 4

    # Without period splitting, a single-line document with periods comes
    # back unchanged as the only line.
    assert kwic(hello_buddy_periods)[0] == hello_buddy_periods

    # With period splitting enabled, the same document is broken into four
    # sentences, each keeping its terminating period where it has one.
    assert kwic(hello_buddy_periods, periodsToBreaks=True) == hello_buddy_periods_output
|
||||
Reference in New Issue
Block a user