2023-07-24 22:31:00 +02:00
|
|
|
|
import re
|
|
|
|
|
import numpy as np
|
|
|
|
|
|
|
|
|
|
|
2023-07-04 19:15:21 +02:00
|
|
|
|
def word_count(text):
    """Count case-insensitive word occurrences in *text*.

    Every character that is not a Russian letter (including ``Ё``/``ё``),
    a Latin letter, a hyphen or whitespace is removed; the remainder is
    lower-cased and split on whitespace.

    Args:
        text: The string to analyse.

    Returns:
        A list of ``(word, count)`` pairs in the sorted order produced by
        ``np.unique``. The elements are NumPy scalars because they come
        straight from the arrays returned by ``np.unique``. An input with
        no words yields an empty list.
    """
    # Whitespace (\s) is kept so that tabs and newlines still separate words
    # instead of being deleted and gluing neighbouring words together.
    # "Ёё" is listed explicitly because it lies outside the "А-Яа-я" range.
    cleaned = re.sub(r"[^А-Яа-яЁёA-Za-z\s-]", "", text).lower()
    words = cleaned.split()
    if not words:
        return []

    unique_words, counts = np.unique(words, return_counts=True)
    return list(zip(unique_words, counts))
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# Sample input: a short Russian sentence with repeated words and punctuation.
f = 'Я пришел, я ушел, я нашел'

# Show the (word, count) pairs computed for the sample sentence.
print(word_count(f))
|