from nltk.corpus import PlaintextCorpusReader
# Folder that holds the plain-text files to analyse.
corpora_folder = '/home/flem/text/rejection/new'
# The file-id pattern is a regular expression; keep it in a raw string so the
# backslashes in `\w` and `\.` are passed to the regex engine verbatim instead
# of being treated as (invalid) string escape sequences.
corpus = PlaintextCorpusReader(corpora_folder, r'^\w.*\.txt')
corpus.fileids()
['wholetext.txt']
corpus.sents()
[['Sorry', ',', 'all', 'rooms', ',', 'studios', ',', 'apartments', 'and', 'houses', 'are', 'no', 'longer', 'available', '.'], ['Everything', 'is', 'fully', 'booked', '.'], ...]
import nltk
# Wrap the corpus tokens in an nltk.Text so the exploratory helpers used
# below (concordance, collocations, count, ...) are available on them.
my_text = nltk.Text(corpus.words())
corpus.words()
['Sorry', ',', 'all', 'rooms', ',', 'studios', ',', ...]
# Show every occurrence of the word with its surrounding context; the
# matches include both "Unfortunately" and "unfortunately".
my_text.concordance('unfortunately')
Displaying 16 of 16 matches: ything is fully booked . You are unfortunately too late . I wish you all the be erty is like most of our housing unfortunately not for students . Unfortunately unfortunately not for students . Unfortunately , it is not possible to qualify to complete your application but unfortunately , your score was not high enough cial media in the coming weeks . Unfortunately , due to the volume of applicant international study experience . Unfortunately after careful review of your app se that are of interest to you . Unfortunately , we will not be moving forward reciate your time and interest . Unfortunately we have already undertaken a han through we shall be in contact . Unfortunately , with this being a student prop you , please just let us know . Unfortunately this property has already been t ything similar comes available . Unfortunately we received the following statem partment with two other people . Unfortunately , we are not allowed to rent out inconvenience . Enjoy your day . Unfortunately , you have not been randomly sel ything is fully booked . You are unfortunately too late . I wish you all the be we hope to meet in the future . Unfortunately , we will not be moving forward site for future roles with us . Unfortunately , we will not be moving forward
my_text.concordance('sorry')
Displaying 10 of 10 matches: Sorry , all rooms , studios , apartments a y success in the future , I ’ m very sorry to inform you that you are not a fin s available for two persons . We are sorry for the inconvenience . Enjoy your d f an extra place becomes available . Sorry , all rooms , studios , apartments a ve informed you Sufficiently . I ’ m sorry to say , however we cannot accept yo applying again in the future . I ’ m sorry to say that your submission was not act you to arrange a viewings . I am sorry but the landlord of this property wi nd will be closing the ad todayI ’ m sorry this property is already under appli rovide our standard service . We are sorry we cannot answer everyone immediatel tlist for the next stage and we ’ re sorry to have to let you know that we won
my_text.concordance('regret')
Displaying 3 of 3 matches: have informed you sufficiently . We regret to inform you that all rooms availa for your interest in this role . We regret to inform you that your application internal changes . As a result , we regret to tell you that we no longer have
my_text.concordance('reject')
Displaying 1 of 1 matches: e Animation academic who has had to reject your application . You indicate you
my_text.common_contexts(["regret", "available"])
No common contexts were found
my_text.collocations()
fully booked; moving forward; get back; luck hunting; next stage; clearly stated; questions please; really appreciate; longer available; would like; student property
my_text.dispersion_plot(["unfortunately", "regret", "sorry", "not"])
my_text.generate()
Building ngram index...
moment . . available . I hope to have informed you Sufficiently . under application . and interest . hesitate to contact me . . for more roles that may be in contact . Apart from the Animation academic who has had to reject your application . your application but unfortunately , your score was not chosen as one of the limited number of applications to put forward to the volume of applications we receive we cannot accept your application , but we ultimately narrowed applicants down to 10 finalists . like to thank you for your interest in this
'moment . . available . I hope to have informed you Sufficiently .\nunder application . and interest . hesitate to contact me . . for more\nroles that may be in contact . Apart from the Animation academic who\nhas had to reject your application . your application but\nunfortunately , your score was not chosen as one of the limited number\nof applications to put forward to the volume of applications we\nreceive we cannot accept your application , but we ultimately narrowed\napplicants down to 10 finalists . like to thank you for your interest\nin this'
my_text.collocations()
fully booked; moving forward; get back; luck hunting; next stage; clearly stated; questions please; really appreciate; longer available; would like; student property
# NOTE: this counts only the exact lower-case token; the capitalised
# "Unfortunately" is a separate token and is not included in the result.
my_text.count("unfortunately")
4
# Import FreqDist from its home module. Importing it via `nltk.book` also
# loads the bundled sample texts (text1..text9) and prints their banner,
# none of which is needed to build a frequency distribution.
from nltk.probability import FreqDist

# Frequency of every token (words and punctuation alike) in the corpus.
fdist_words = FreqDist(my_text)
fdist_words
*** Introductory Examples for the NLTK Book *** Loading text1, ..., text9 and sent1, ..., sent9 Type the name of the text or sentence to view it. Type: 'texts()' or 'sents()' to list the materials. text1: Moby Dick by Herman Melville 1851 text2: Sense and Sensibility by Jane Austen 1811 text3: The Book of Genesis text4: Inaugural Address Corpus text5: Chat Corpus text6: Monty Python and the Holy Grail text7: Wall Street Journal text8: Personals Corpus text9: The Man Who Was Thursday by G . K . Chesterton 1908
FreqDist({'.': 91, 'to': 60, 'the': 50, 'you': 49, ',': 47, 'we': 43, 'for': 38, 'your': 34, 'and': 33, 'a': 28, ...})
fdist_words.most_common(50)
[('.', 91), ('to', 60), ('the', 50), ('you', 49), (',', 47), ('we', 43), ('for', 38), ('your', 34), ('and', 33), ('a', 28), ('this', 28), ('not', 27), ('of', 24), ('be', 22), ('in', 22), ('have', 21), ('is', 20), ('that', 18), ('are', 17), ('application', 16), ('I', 15), ('We', 15), ('will', 14), ('property', 12), ('our', 12), ('Unfortunately', 12), ('with', 11), ('interest', 11), ('’', 10), ('if', 10), ('on', 10), ('an', 9), ('but', 8), ('sorry', 8), ('all', 7), ('available', 7), ('any', 7), ('contact', 7), ('would', 7), ('future', 7), ('were', 7), ('has', 7), ('please', 6), ('it', 6), ('as', 6), ('applications', 6), ('t', 6), ('Please', 6), ('let', 6), ('If', 5)]
fdist_words.plot()
<AxesSubplot:xlabel='Samples', ylabel='Counts'>
# Tabulate the corpus-wide frequency of each of the first ten tokens.
fdist_words.tabulate(samples=my_text[:10])
Sorry , all rooms , studios , apartments and houses 2 47 7 3 47 2 47 3 33 2
# Walk the text in consecutive windows of `step` tokens and, for each window,
# print a table of the corpus-wide frequency of every token it contains.
step = 10
for iteration in range(0, len(my_text), step):
    # The final window may be shorter than `step`; slicing handles that.
    fdist_words.tabulate(samples=my_text[iteration:iteration + step])
Sorry , all rooms , studios , apartments and houses 2 47 7 3 47 2 47 3 33 2 are no longer available . Everything is fully booked . 17 4 3 7 91 2 20 3 4 91 You are unfortunately too late . I wish you all 4 17 4 4 2 91 15 4 49 7 the best of luck hunting for a place to live 50 2 24 2 2 38 28 4 60 3 . If you have any questions please do not hesitate 91 5 49 21 7 2 6 4 27 2 to contact me . I hope to have informed you 60 7 3 91 15 4 60 21 3 49 Sufficiently . However , this property is like most of 2 91 2 47 28 12 20 3 1 24 our housing unfortunately not for students . Unfortunately , it 12 1 4 27 38 4 91 12 47 6 is not possible to qualify for this property as a 20 27 3 60 1 38 28 12 6 28 student . This means that we cannot schedule a viewing 3 91 3 1 18 43 5 2 28 3 for this property with you at the moment . We 38 28 12 11 49 5 50 2 91 15 would be happy to schedule another appointment with you in 7 22 1 60 2 1 1 11 49 22 the future . Hope to have informed you sufficiently . 50 7 91 1 60 21 3 49 1 91 We regret to inform you that all rooms available for 15 3 60 5 49 18 7 3 7 38 full degree students are fully booked . We really appreciate 1 1 4 17 3 4 91 15 3 5 your interest the time taken to complete your application but 34 11 50 5 2 60 1 34 16 8 unfortunately , your score was not high enough to proceed 4 47 34 1 4 27 2 2 60 1 to the next stage . Whilst this may not be 60 50 2 2 91 1 28 3 27 22 the news you were hoping to hear , we were 50 1 49 7 1 60 1 47 43 7 lucky enough to have received over 4 , 500 applications 1 2 60 21 2 1 1 47 1 6 for only 9 internships , so don ’ t be 38 4 1 1 47 3 1 10 6 22 too disheartened . Even if you were able to secure 4 1 91 1 10 49 7 1 60 1 a place this year , this doesn ’ t mean 28 4 28 3 47 28 2 10 6 2 publishing isn ’ t for you . 
You can find 1 1 10 6 38 49 91 4 4 1 our currently live entry - level role here and we 12 4 3 2 4 1 3 3 33 43 will be opening applications for our positive action traineeship The 14 22 1 6 38 12 1 1 1 2 Scheme on 20th April . Find out if you ’ 1 10 1 1 91 1 3 10 49 10 re eligible here . We wish you every success in 2 2 3 91 15 4 49 1 1 22 the future , I ’ m very sorry to inform 50 7 47 15 10 5 2 8 60 5 you that you are not a finalist . We are 49 18 49 17 27 28 1 91 15 17 grateful for your entry to the scholarship and can assure 1 38 34 2 60 50 2 33 4 1 you that your essay was read and considered by at 49 18 34 1 4 1 33 2 4 5 least two members of our scholarship committee . The competition 1 3 1 24 12 2 2 91 2 1 was intense . Many applicants met our criteria of an 4 1 91 1 3 1 12 1 24 9 ideal candidate , and many had great answers for choosing 1 1 47 33 2 2 1 1 38 1 their country of study and how they planned to evolve 2 1 24 2 33 1 1 1 60 1 into a globally - minded leader – but we ultimately 1 28 1 4 1 1 1 8 43 1 narrowed applicants down to 10 finalists . We will inform 1 3 1 60 1 3 91 15 14 5 the finalists this week and will be announcing the winner 50 3 28 2 33 14 22 2 50 1 on our website and on social media in the coming 10 12 1 33 10 1 1 22 50 1 weeks . Unfortunately , due to the volume of applicants 1 91 12 47 3 60 50 2 24 3 we cannot provide you with any personalized feedback on your 43 5 2 49 11 7 1 1 10 34 application . Thank you for your application and we wish 16 91 2 49 38 34 16 33 43 4 you a wonderful and rewarding international study experience . Unfortunately 49 28 1 33 1 1 2 2 91 12 after careful review of your application we have decided to 2 1 2 24 34 16 43 21 1 60 pursue other candidates whose background more closely matches the specific 1 4 3 1 1 3 2 1 50 2 skills and / or experience required for the job . 
1 33 2 1 2 1 38 50 1 91 Please continue to review our open positions online and apply 6 1 60 2 12 1 1 1 33 2 to those that are of interest to you . Unfortunately 60 3 18 17 24 11 60 49 91 12 , we will not be moving forward with your application 47 43 14 27 22 3 4 11 34 16 , but we appreciate your time and interest . Unfortunately 47 8 43 5 34 5 33 11 91 12 we have already undertaken a handful of viewings at the 43 21 4 1 28 1 24 2 5 50 flat . If the current interests falls through we shall 1 91 5 50 1 1 1 2 43 1 be in contact . Unfortunately , with this being a 22 22 7 91 12 47 11 28 1 28 student property it would not be suitable for those who 3 12 6 7 27 22 3 38 3 3 are in employment I ' m afraid . Of course 17 22 1 15 5 5 3 91 1 1 if you still were interested in taking a room there 10 49 1 7 1 22 1 28 2 4 then we can certainly arrange a viewing for you , 1 43 4 2 2 28 3 38 49 47 please just let us know . Unfortunately this property has 6 4 6 4 5 91 12 28 12 7 already been taken and the tenant is going through referencing 4 4 2 33 50 2 20 1 2 1 . I have added your details to our system and 91 15 21 1 34 1 60 12 1 33 will get back in touch if anything similar comes available 14 2 2 22 2 10 1 1 1 7 . Unfortunately we received the following statement from the Animation 91 12 43 2 50 2 1 3 50 1 academic who has had to reject your application . You 1 3 7 2 60 1 34 16 91 4 indicate you want to rent an apartment with two other 1 49 2 60 4 9 3 11 3 4 people . Unfortunately , we are not allowed to rent 2 91 12 47 43 17 27 2 60 4 out this specific apartment to three people as the municipality 3 28 2 3 60 2 2 6 50 1 has recently introduced new rules . At the moment we 7 1 1 1 1 91 1 50 2 43 only have properties available for two persons . We are 4 21 3 7 38 3 2 91 15 17 sorry for the inconvenience . Enjoy your day . 
Unfortunately 8 38 50 1 91 1 34 1 91 12 , you have not been randomly selected this time , 47 49 21 27 4 1 1 28 5 47 but we may be in touch if an extra place 8 43 3 22 22 2 10 9 1 4 becomes available . Sorry , all rooms , studios , 1 7 91 2 47 7 3 47 2 47 apartments and houses are no longer available . Everything is 3 33 2 17 4 3 7 91 2 20 fully booked . You are unfortunately too late . I 3 4 91 4 17 4 4 2 91 15 wish you all the best of luck hunting for a 4 49 7 50 2 24 2 2 38 28 place to live . If you have any questions please 4 60 3 91 5 49 21 7 2 6 do not hesitate to contact me . I hope to 4 27 2 60 7 3 91 15 4 60 have informed you Sufficiently . I ’ m sorry to 21 3 49 2 91 15 10 5 8 60 say , however we cannot accept your application this year 2 47 1 43 5 3 34 16 28 3 , as it is now too far after the deadline 47 6 6 20 3 4 1 2 50 1 and the committee has already completed their reviews of all 33 50 2 7 4 1 2 1 24 7 the applications . I hope you understand and would consider 50 6 91 15 4 49 1 33 7 1 applying again in the future . I ’ m sorry 2 3 22 50 7 91 15 10 5 8 to say that your submission was not chosen by the 60 2 18 34 1 4 27 3 4 50 jury this year . We will be announcing the winners 1 28 3 91 15 14 22 2 50 3 this week , but we wanted to notify you in 28 2 47 8 43 1 60 1 49 22 advance . Please be assured : even though you were 1 91 6 22 1 2 1 1 49 7 not chosen as one of the top winners , this 27 3 6 2 24 50 1 3 47 28 does not mean we think your photos are not good 2 27 2 43 1 34 1 17 27 1 ! Because of the limited number of spots for winners 1 1 24 50 1 3 24 1 38 3 and finalists , a lot of truly excellent submissions could 33 3 47 28 1 24 1 1 1 1 not be chosen for the final cut made by the 27 22 3 38 50 1 1 2 4 50 judges . We have considered your application and would like 1 91 15 21 2 34 16 33 7 3 to thank you for your interest in this role . 
60 2 49 38 34 11 22 28 3 91 We regret to inform you that your application has not 15 3 60 5 49 18 34 16 7 27 been progressed . Do keep an eye on our opportunities 4 1 91 1 4 9 2 10 12 2 page for more roles that may be of interest . 1 38 3 2 18 3 22 24 11 91 If you would like advice on future applications , please 5 49 7 3 1 10 7 6 47 6 email here . First of all , we really want 2 3 91 1 24 7 47 43 3 2 to thank you for your interest . Since your application 60 2 49 38 34 11 91 1 34 16 , you haven ' t heard from us in a 47 49 1 5 6 1 3 4 22 28 while . Apart from the August holidays , that ' 1 91 1 3 50 1 1 47 18 5 s because we have been managing internal changes . As 2 1 43 21 4 1 1 1 91 4 a result , we regret to tell you that we 28 1 47 43 3 60 1 49 18 43 no longer have a vacancy for this position available . 4 3 21 28 2 38 28 3 7 91 However , we foresee that in some months we might 2 47 43 1 18 22 2 1 43 1 have to return to this process . As such , 21 60 1 60 28 1 91 4 1 47 we would be keen to keep your profile on file 43 7 22 1 60 4 34 1 10 1 and contact you in case of any future opportunities . 33 7 49 22 2 24 7 7 2 91 Thank you again for your interest and we hope to 2 49 3 38 34 11 33 43 4 60 meet in the future . Unfortunately , we will not 1 22 50 7 91 12 47 43 14 27 be moving forward with your application , but we appreciate 22 3 4 11 34 16 47 8 43 5 your time and interest . Just to let you know 34 5 33 11 91 1 60 6 49 5 out of courtesy our property on Killigrew Street is now 3 24 1 12 12 10 1 1 20 3 let agreed . Please let us know if you see 6 1 91 6 6 4 5 10 49 1 any other properties that interest you . This property currently 7 4 3 18 11 49 91 3 12 4 has an application submitted subject to references and credit checks 7 9 16 1 1 60 1 33 1 1 . 
I am afraid the property you have enquired about 91 15 4 3 50 12 49 21 1 2 is not a student property , and ideally the landlord 20 27 28 3 12 47 33 1 50 3 would be looking for a professional couple / family to 7 22 3 38 28 1 2 2 1 60 take the property . I will certainly keep you in 1 50 12 91 15 14 2 4 49 22 mind if any suitable properties come up . We do 1 10 7 3 3 1 1 91 15 4 have a number of applications to put forward to the 21 28 3 24 6 60 1 4 60 50 landlord , if he does not accept any of them 3 47 10 1 2 27 3 7 24 1 we will contact you to arrange a viewings . I 43 14 7 49 60 2 28 2 91 15 am sorry but the landlord of this property will not 4 8 8 50 3 24 28 12 14 27 accept students . I am just emailing in regard to 3 4 91 15 4 4 1 22 1 60 the enquiry you made about a room we have to 50 2 49 2 2 28 2 43 21 60 rent in Penryn . I am afraid that this is 4 22 1 91 15 4 3 18 28 20 not suitable for a couple - it is for one 27 3 38 28 2 4 6 20 38 2 person only . Thanks for your enquiry , we have 2 4 91 2 38 34 2 47 43 21 just accepted a tenant and will be closing the ad 4 1 28 2 33 14 22 1 50 1 todayI ’ m sorry this property is already under application 1 10 5 8 28 12 20 4 1 16 . It is not possible to rent this apartment with 91 1 20 27 3 60 4 28 3 11 a guarantor . Due to an extremely high number of 28 1 91 1 60 9 1 2 3 24 viewing requests , Riva is currently very difficult to reach 3 2 47 1 20 4 2 1 60 1 by phone and email . We receive so many requests 4 1 33 2 91 15 2 3 2 2 we can not provide our standard service . We are 43 4 27 2 12 1 1 91 15 17 sorry we cannot answer everyone immediately so please be patient 8 43 5 1 2 1 3 6 22 2 . If there is a permit for three persons it 91 5 4 20 28 1 38 2 2 6 ' s clearly stated in the advertisement and it is 5 2 2 3 22 50 1 33 6 20 also clearly stated if students are allowed . Only apply 1 2 3 10 4 17 2 91 1 2 for those apartments . Otherwise , there is no point 38 3 3 91 1 47 4 20 4 1 in submitting an application . 
Please be patient and we 22 1 9 16 91 6 22 2 33 43 will get back to you as soon as possible . 14 2 2 60 49 6 1 6 3 91 This e - mail is to inform you that your 3 1 4 1 20 60 5 49 18 34 contact person at your educational institution has not approved your 7 2 5 34 1 1 7 27 1 34 registration for accommodation due to the following reason : Fully 1 38 1 3 60 50 2 1 2 1 booked . We have now reached a shortlist for the 4 91 15 21 3 1 28 1 38 50 next stage and we ’ re sorry to have to 2 2 33 43 10 2 8 60 21 60 let you know that we won ’ t be progressing 6 49 5 18 43 1 10 6 22 1 with your application . We really appreciate you applying for 11 34 16 91 15 3 5 49 2 38 the role . On this occasion , there were just 50 3 91 1 28 1 47 4 7 4 some other candidates that more closely matched what we were 2 4 3 18 3 2 1 1 43 7 looking for in this position . Thanks again for your 3 38 22 28 3 91 2 3 38 34 interest and please do keep an eye on our careers 11 33 6 4 4 9 2 10 12 1 site for future roles with us . Unfortunately , we 1 38 7 2 11 4 91 12 47 43 will not be moving forward with your application , but 14 27 22 3 4 11 34 16 47 8 we appreciate your time and interest in Confidential . Please 43 5 34 5 33 11 22 1 91 6 note that due to the volume of applications we receive 1 18 3 60 50 2 24 6 43 2 we cannot contact everyone . As this is an internship 43 5 7 2 91 4 28 20 9 2 we are only looking for candidates who are currently enrolled 43 17 4 3 38 3 3 17 4 2 at a university ( and will remain enrolled throughout the 5 28 1 1 33 14 1 2 1 50 entire internship ). Based on your resume this doesn ' 1 2 1 1 10 34 1 28 2 5 t seem to be the case , meaning that you 6 1 60 22 50 2 47 1 18 49 are not eligible for this position . As the vacancy 17 27 2 38 28 3 91 4 50 2 stated , this is a strict requirement . Please feel 3 47 28 20 28 1 1 91 6 1 free to let me know if my assumption is wrong 1 60 6 3 5 10 1 1 20 1 . 91
# Distinct tokens that occur anywhere in the text.
vocabulary = set(my_text)
# Words longer than four characters, sorted once here so that every later
# loop over `long_words` runs in a stable, reproducible order instead of the
# arbitrary iteration order of the underlying set.
long_words = sorted(w for w in vocabulary if len(w) > 4)
long_words
['Animation', 'Apart', 'April', 'August', 'Based', 'Because', 'Confidential', 'Enjoy', 'Everything', 'First', 'Fully', 'However', 'Killigrew', 'Otherwise', 'Penryn', 'Please', 'Scheme', 'Since', 'Sorry', 'Street', 'Sufficiently', 'Thank', 'Thanks', 'Unfortunately', 'Whilst', 'about', 'academic', 'accept', 'accepted', 'accommodation', 'action', 'added', 'advance', 'advertisement', 'advice', 'afraid', 'after', 'again', 'agreed', 'allowed', 'already', 'announcing', 'another', 'answer', 'answers', 'anything', 'apartment', 'apartments', 'applicants', 'application', 'applications', 'apply', 'applying', 'appointment', 'appreciate', 'approved', 'arrange', 'assumption', 'assure', 'assured', 'available', 'background', 'because', 'becomes', 'being', 'booked', 'candidate', 'candidates', 'cannot', 'careers', 'careful', 'certainly', 'changes', 'checks', 'choosing', 'chosen', 'clearly', 'closely', 'closing', 'comes', 'coming', 'committee', 'competition', 'complete', 'completed', 'consider', 'considered', 'contact', 'continue', 'could', 'country', 'couple', 'course', 'courtesy', 'credit', 'criteria', 'current', 'currently', 'deadline', 'decided', 'degree', 'details', 'difficult', 'disheartened', 'doesn', 'educational', 'eligible', 'email', 'emailing', 'employment', 'enough', 'enquired', 'enquiry', 'enrolled', 'entire', 'entry', 'essay', 'every', 'everyone', 'evolve', 'excellent', 'experience', 'extra', 'extremely', 'falls', 'family', 'feedback', 'final', 'finalist', 'finalists', 'following', 'foresee', 'forward', 'fully', 'future', 'globally', 'going', 'grateful', 'great', 'guarantor', 'handful', 'happy', 'haven', 'heard', 'hesitate', 'holidays', 'hoping', 'houses', 'housing', 'however', 'hunting', 'ideal', 'ideally', 'immediately', 'inconvenience', 'indicate', 'inform', 'informed', 'institution', 'intense', 'interest', 'interested', 'interests', 'internal', 'international', 'internship', 'internships', 'introduced', 'judges', 'landlord', 'leader', 'least', 'level', 'limited', 
'longer', 'looking', 'lucky', 'managing', 'matched', 'matches', 'meaning', 'means', 'media', 'members', 'might', 'minded', 'moment', 'months', 'moving', 'municipality', 'narrowed', 'notify', 'number', 'occasion', 'online', 'opening', 'opportunities', 'other', 'patient', 'people', 'permit', 'person', 'personalized', 'persons', 'phone', 'photos', 'place', 'planned', 'please', 'point', 'position', 'positions', 'positive', 'possible', 'proceed', 'process', 'professional', 'profile', 'progressed', 'progressing', 'properties', 'property', 'provide', 'publishing', 'pursue', 'qualify', 'questions', 'randomly', 'reach', 'reached', 'really', 'reason', 'receive', 'received', 'recently', 'references', 'referencing', 'regard', 'registration', 'regret', 'reject', 'remain', 'requests', 'required', 'requirement', 'result', 'resume', 'return', 'review', 'reviews', 'rewarding', 'roles', 'rooms', 'rules', 'schedule', 'scholarship', 'score', 'secure', 'selected', 'service', 'shall', 'shortlist', 'similar', 'skills', 'social', 'sorry', 'specific', 'spots', 'stage', 'standard', 'stated', 'statement', 'still', 'strict', 'student', 'students', 'studios', 'study', 'subject', 'submission', 'submissions', 'submitted', 'submitting', 'success', 'sufficiently', 'suitable', 'system', 'taken', 'taking', 'tenant', 'thank', 'their', 'there', 'think', 'those', 'though', 'three', 'through', 'throughout', 'todayI', 'touch', 'traineeship', 'truly', 'ultimately', 'under', 'understand', 'undertaken', 'unfortunately', 'university', 'vacancy', 'viewing', 'viewings', 'volume', 'wanted', 'website', 'weeks', 'while', 'whose', 'winner', 'winners', 'wonderful', 'would', 'wrong']
# Wrap the long-word list in an nltk.Text and tabulate the corpus-wide
# frequency of those words, `step` words per table.
my_long_words = nltk.Text(long_words)
step = 10
for iteration in range(0, len(my_long_words), step):
    # The final slice may hold fewer than `step` words.
    fdist_words.tabulate(samples=my_long_words[iteration:iteration + step])
positive ultimately answer progressed employment progressing coming current longer thank 1 1 1 1 1 1 1 1 3 2 because required similar extra planned website complete subject criteria reach 1 1 1 1 1 1 1 1 1 1 result again position closing academic handful assumption submission country understand 1 3 3 1 1 1 1 1 1 1 Otherwise their holidays Please strict internal wrong educational evolve matches 1 2 1 6 1 1 1 1 1 1 action foresee contact viewing currently proceed credit agreed announcing received 1 1 7 3 4 1 1 1 2 2 August Penryn completed through shall think competition service continue roles 1 1 1 2 1 1 1 1 1 2 submitting remain traineeship other advance really careers lucky candidates Scheme 1 1 1 4 1 3 1 1 3 1 hunting considered online three allowed however Enjoy schedule closely system 2 2 1 2 2 1 1 2 2 1 internship interest stated whose couple taking applicants limited there Sorry 2 11 3 1 2 1 3 1 4 2 everyone entire those properties personalized tenant feedback positions months experience 2 1 3 3 1 2 1 1 1 2 introduced afraid accept added courtesy place reviews being rooms means 1 3 3 1 1 4 1 1 3 1 becomes skills Street indicate student entry pursue guarantor hesitate difficult 1 1 1 1 3 2 1 1 2 1 heard Confidential spots enrolled number Thanks meaning qualify accommodation consider 1 1 1 2 3 2 1 1 1 1 provide review Sufficiently sufficiently throughout inconvenience could return person profile 2 2 2 1 1 1 1 1 2 1 Animation students weeks Apart winner property going deadline forward details 1 4 1 1 1 12 1 1 4 1 sorry committee applying Fully enough after finalists referencing haven decided 8 2 2 1 2 2 3 1 1 1 degree inform least future municipality extremely statement study certainly questions 1 5 1 7 1 1 1 2 2 2 approved selected might success applications background regard available occasion people 1 1 1 1 6 1 1 7 1 2 studios ideally volume interested minded immediately Killigrew Since persons Whilst 2 1 2 1 1 1 1 1 2 1 housing wonderful secure rewarding 
touch already apartments professional enquired happy 1 1 1 1 2 4 3 1 1 1 truly disheartened suitable changes rules social application opening process references 1 1 3 1 1 1 16 1 1 1 about possible interests accepted moving winners falls university score advertisement 2 3 1 1 3 3 1 1 1 1 chosen Because regret leader please cannot enquiry landlord Thank permit 3 1 3 1 6 5 2 3 2 1 booked eligible randomly candidate moment receive another opportunities undertaken appointment 4 2 1 1 2 2 1 2 1 1 resume while notify great matched would finalist emailing registration wanted 1 1 1 1 1 7 1 1 1 1 judges still First narrowed excellent managing reached scholarship checks Unfortunately 1 1 1 1 1 1 1 2 1 12 stage standard requirement course doesn viewings final However grateful international 2 1 1 1 2 2 1 2 1 1 requests Everything recently appreciate anything institution though hoping choosing careful 2 2 1 5 1 1 1 1 1 1 essay level publishing intense answers taken media comes every unfortunately 1 1 1 1 1 2 1 1 1 4 assured vacancy members shortlist reject apartment clearly arrange reason April 1 2 1 1 1 3 2 2 1 1 ideal advice looking submissions family fully specific apply houses assure 1 1 3 1 1 3 2 2 2 1 todayI phone submitted internships point following informed Based patient globally 1 1 1 1 1 2 3 1 2 1 under photos email 1 1 2
# For every long word that occurs more than three times, print the word
# repeated once per occurrence (a crude textual bar chart).
for word in long_words:
    # Look the count up in the precomputed frequency distribution rather than
    # rescanning the whole token list for each word.
    count = fdist_words[word]
    if count > 3:
        print(word * count)
PleasePleasePleasePleasePleasePlease contactcontactcontactcontactcontactcontactcontact currentlycurrentlycurrentlycurrently otherotherotherother interestinterestinterestinterestinterestinterestinterestinterestinterestinterestinterest theretheretherethere placeplaceplaceplace studentsstudentsstudentsstudents propertypropertypropertypropertypropertypropertypropertypropertypropertypropertypropertyproperty forwardforwardforwardforward sorrysorrysorrysorrysorrysorrysorrysorry informinforminforminforminform futurefuturefuturefuturefuturefuturefuture applicationsapplicationsapplicationsapplicationsapplicationsapplications availableavailableavailableavailableavailableavailableavailable alreadyalreadyalreadyalready applicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplicationapplication pleasepleasepleasepleasepleaseplease cannotcannotcannotcannotcannot bookedbookedbookedbooked wouldwouldwouldwouldwouldwouldwould UnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunatelyUnfortunately appreciateappreciateappreciateappreciateappreciate unfortunatelyunfortunatelyunfortunatelyunfortunately
--------------------------------------------------------------------------- AttributeError Traceback (most recent call last) /tmp/ipykernel_11116/135372240.py in <module> ----> 1 corpus.sentences() AttributeError: 'PlaintextCorpusReader' object has no attribute 'sentences'
from nltk.tokenize import word_tokenize
# Raw text of the rejection messages, held inline as one string so it can be
# passed to the NLTK tokenizers below. The text is data: keep it verbatim
# (including its typos such as "todayI’m" and "students.I am"), because any
# change alters the tokenization results.
# NOTE(review): this looks like the same text as the corpus file loaded through
# PlaintextCorpusReader at the top of the file — confirm; if it is, reading it
# from the corpus reader would avoid maintaining this duplicated literal.
s="Sorry, all rooms, studios, apartments and houses are no longer available. Everything is fully booked. You are unfortunately too late. I wish you all the best of luck hunting for a place to live. If you have any questions please do not hesitate to contact me. I hope to have informed you Sufficiently. However, this property is like most of our housing unfortunately not for students. Unfortunately, it is not possible to qualify for this property as a student. This means that we cannot schedule a viewing for this property with you at the moment. We would be happy to schedule another appointment with you in the future. Hope to have informed you sufficiently. We regret to inform you that all rooms available for full degree students are fully booked. We really appreciate your interest the time taken to complete your application but unfortunately, your score was not high enough to proceed to the next stage. Whilst this may not be the news you were hoping to hear, we were lucky enough to have received over 4,500 applications for only 9 internships, so don’t be too disheartened. Even if you were able to secure a place this year, this doesn’t mean publishing isn’t for you. You can find our currently live entry-level role here and we will be opening applications for our positive action traineeship The Scheme on 20th April. Find out if you’re eligible here. We wish you every success in the future,I’m very sorry to inform you that you are not a finalist. We are grateful for your entry to the scholarship and can assure you that your essay was read and considered by at least two members of our scholarship committee. The competition was intense. Many applicants met our criteria of an ideal candidate, and many had great answers for choosing their country of study and how they planned to evolve into a globally-minded leader – but we ultimately narrowed applicants down to 10 finalists. 
We will inform the finalists this week and will be announcing the winner on our website and on social media in the coming weeks. Unfortunately, due to the volume of applicants we cannot provide you with any personalized feedback on your application. Thank you for your application and we wish you a wonderful and rewarding international study experience. Unfortunately after careful review of your application we have decided to pursue other candidates whose background more closely matches the specific skills and/or experience required for the job. Please continue to review our open positions online and apply to those that are of interest to you. Unfortunately, we will not be moving forward with your application, but we appreciate your time and interest. Unfortunately we have already undertaken a handful of viewings at the flat. If the current interests falls through we shall be in contact. Unfortunately, with this being a student property it would not be suitable for those who are in employment I'm afraid. Of course if you still were interested in taking a room there then we can certainly arrange a viewing for you, please just let us know. Unfortunately this property has already been taken and the tenant is going through referencing. I have added your details to our system and will get back in touch if anything similar comes available. Unfortunately we received the following statement from the Animation academic who has had to reject your application. You indicate you want to rent an apartment with two other people. Unfortunately, we are not allowed to rent out this specific apartment to three people as the municipality has recently introduced new rules. At the moment we only have properties available for two persons. We are sorry for the inconvenience. Enjoy your day. Unfortunately, you have not been randomly selected this time, but we may be in touch if an extra place becomes available. Sorry, all rooms, studios, apartments and houses are no longer available. 
Everything is fully booked. You are unfortunately too late. I wish you all the best of luck hunting for a place to live. If you have any questions please do not hesitate to contact me. I hope to have informed you Sufficiently. I’m sorry to say, however we cannot accept your application this year, as it is now too far after the deadline and the committee has already completed their reviews of all the applications. I hope you understand and would consider applying again in the future. I’m sorry to say that your submission was not chosen by the jury this year. We will be announcing the winners this week, but we wanted to notify you in advance. Please be assured: even though you were not chosen as one of the top winners, this does not mean we think your photos are not good! Because of the limited number of spots for winners and finalists, a lot of truly excellent submissions could not be chosen for the final cut made by the judges. We have considered your application and would like to thank you for your interest in this role. We regret to inform you that your application has not been progressed. Do keep an eye on our opportunities page for more roles that may be of interest. If you would like advice on future applications, please email here. First of all, we really want to thank you for your interest. Since your application, you haven't heard from us in a while. Apart from the August holidays, that's because we have been managing internal changes. As a result, we regret to tell you that we no longer have a vacancy for this position available. However, we foresee that in some months we might have to return to this process. As such, we would be keen to keep your profile on file and contact you in case of any future opportunities. Thank you again for your interest and we hope to meet in the future. Unfortunately, we will not be moving forward with your application, but we appreciate your time and interest. 
Just to let you know out of courtesy our property on Killigrew Street is now let agreed. Please let us know if you see any other properties that interest you. This property currently has an application submitted subject to references and credit checks. I am afraid the property you have enquired about is not a student property, and ideally the landlord would be looking for a professional couple/ family to take the property. I will certainly keep you in mind if any suitable properties come up. We do have a number of applications to put forward to the landlord, if he does not accept any of them we will contact you to arrange a viewings. I am sorry but the landlord of this property will not accept students.I am just emailing in regard to the enquiry you made about a room we have to rent in Penryn. I am afraid that this is not suitable for a couple - it is for one person only. Thanks for your enquiry, we have just accepted a tenant and will be closing the ad todayI’m sorry this property is already under application. It is not possible to rent this apartment with a guarantor. Due to an extremely high number of viewing requests, Riva is currently very difficult to reach by phone and email. We receive so many requests we can not provide our standard service. We are sorry we cannot answer everyone immediately so please be patient. If there is a permit for three persons it's clearly stated in the advertisement and it is also clearly stated if students are allowed. Only apply for those apartments. Otherwise, there is no point in submitting an application. Please be patient and we will get back to you as soon as possible. This e-mail is to inform you that your contact person at your educational institution has not approved your registration for accommodation due to the following reason: Fully booked. We have now reached a shortlist for the next stage and we’re sorry to have to let you know that we won’t be progressing with your application. 
We really appreciate you applying for the role. On this occasion, there were just some other candidates that more closely matched what we were looking for in this position. Thanks again for your interest and please do keep an eye on our careers site for future roles with us. Unfortunately, we will not be moving forward with your application, but we appreciate your time and interest in Confidential. Please note that due to the volume of applications we receive we cannot contact everyone. As this is an internship we are only looking for candidates who are currently enrolled at a university (and will remain enrolled throughout the entire internship). Based on your resume this doesn't seem to be the case, meaning that you are not eligible for this position. As the vacancy stated, this is a strict requirement. Please feel free to let me know if my assumption is wrong."
from nltk.tokenize import sent_tokenize, word_tokenize
# Split the raw text into sentences; as a bare expression the resulting list
# is only displayed, not stored.
sent_tokenize(s)
['Sorry, all rooms, studios, apartments and houses are no longer available.', 'Everything is fully booked.', 'You are unfortunately too late.', 'I wish you all the best of luck hunting for a place to live.', 'If you have any questions please do not hesitate to contact me.', 'I hope to have informed you Sufficiently.', 'However, this property is like most of our housing unfortunately not for students.', 'Unfortunately, it is not possible to qualify for this property as a student.', 'This means that we cannot schedule a viewing for this property with you at the moment.', 'We would be happy to schedule another appointment with you in the future.', 'Hope to have informed you sufficiently.', 'We regret to inform you that all rooms available for full degree students are fully booked.', 'We really appreciate your interest the time taken to complete your application but unfortunately, your score was not high enough to proceed to the next stage.', 'Whilst this may not be the news you were hoping to hear, we were lucky enough to have received over 4,500 applications for only 9 internships, so don’t be too disheartened.', 'Even if you were able to secure a place this year, this doesn’t mean publishing isn’t for you.', 'You can find our currently live entry-level role here and we will be opening applications for our positive action traineeship The Scheme on 20th April.', 'Find out if you’re eligible here.', 'We wish you every success in the future,I’m very sorry to inform you that you are not a finalist.', 'We are grateful for your entry to the scholarship and can assure you that your essay was read and considered by at least two members of our scholarship committee.', 'The competition was intense.', 'Many applicants met our criteria of an ideal candidate, and many had great answers for choosing their country of study and how they planned to evolve into a globally-minded leader – but we ultimately narrowed applicants down to 10 finalists.', 'We will inform the finalists this 
week and will be announcing the winner on our website and on social media in the coming weeks.', 'Unfortunately, due to the volume of applicants we cannot provide you with any personalized feedback on your application.', 'Thank you for your application and we wish you a wonderful and rewarding international study experience.', 'Unfortunately after careful review of your application we have decided to pursue other candidates whose background more closely matches the specific skills and/or experience required for the job.', 'Please continue to review our open positions online and apply to those that are of interest to you.', 'Unfortunately, we will not be moving forward with your application, but we appreciate your time and interest.', 'Unfortunately we have already undertaken a handful of viewings at the flat.', 'If the current interests falls through we shall be in contact.', "Unfortunately, with this being a student property it would not be suitable for those who are in employment I'm afraid.", 'Of course if you still were interested in taking a room there then we can certainly arrange a viewing for you, please just let us know.', 'Unfortunately this property has already been taken and the tenant is going through referencing.', 'I have added your details to our system and will get back in touch if anything similar comes available.', 'Unfortunately we received the following statement from the Animation academic who has had to reject your application.', 'You indicate you want to rent an apartment with two other people.', 'Unfortunately, we are not allowed to rent out this specific apartment to three people as the municipality has recently introduced new rules.', 'At the moment we only have properties available for two persons.', 'We are sorry for the inconvenience.', 'Enjoy your day.', 'Unfortunately, you have not been randomly selected this time, but we may be in touch if an extra place becomes available.', 'Sorry, all rooms, studios, apartments and houses are no 
longer available.', 'Everything is fully booked.', 'You are unfortunately too late.', 'I wish you all the best of luck hunting for a place to live.', 'If you have any questions please do not hesitate to contact me.', 'I hope to have informed you Sufficiently.', 'I’m sorry to say, however we cannot accept your application this year, as it is now too far after the deadline and the committee has already completed their reviews of all the applications.', 'I hope you understand and would consider applying again in the future.', 'I’m sorry to say that your submission was not chosen by the jury this year.', 'We will be announcing the winners this week, but we wanted to notify you in advance.', 'Please be assured: even though you were not chosen as one of the top winners, this does not mean we think your photos are not good!', 'Because of the limited number of spots for winners and finalists, a lot of truly excellent submissions could not be chosen for the final cut made by the judges.', 'We have considered your application and would like to thank you for your interest in this role.', 'We regret to inform you that your application has not been progressed.', 'Do keep an eye on our opportunities page for more roles that may be of interest.', 'If you would like advice on future applications, please email here.', 'First of all, we really want to thank you for your interest.', "Since your application, you haven't heard from us in a while.", "Apart from the August holidays, that's because we have been managing internal changes.", 'As a result, we regret to tell you that we no longer have a vacancy for this position available.', 'However, we foresee that in some months we might have to return to this process.', 'As such, we would be keen to keep your profile on file and contact you in case of any future opportunities.', 'Thank you again for your interest and we hope to meet in the future.', 'Unfortunately, we will not be moving forward with your application, but we appreciate 
your time and interest.', 'Just to let you know out of courtesy our property on Killigrew Street is now let agreed.', 'Please let us know if you see any other properties that interest you.', 'This property currently has an application submitted subject to references and credit checks.', 'I am afraid the property you have enquired about is not a student property, and ideally the landlord would be looking for a professional couple/ family to take the property.', 'I will certainly keep you in mind if any suitable properties come up.', 'We do have a number of applications to put forward to the landlord, if he does not accept any of them we will contact you to arrange a viewings.', 'I am sorry but the landlord of this property will not accept students.I am just emailing in regard to the enquiry you made about a room we have to rent in Penryn.', 'I am afraid that this is not suitable for a couple - it is for one person only.', 'Thanks for your enquiry, we have just accepted a tenant and will be closing the ad todayI’m sorry this property is already under application.', 'It is not possible to rent this apartment with a guarantor.', 'Due to an extremely high number of viewing requests, Riva is currently very difficult to reach by phone and email.', 'We receive so many requests we can not provide our standard service.', 'We are sorry we cannot answer everyone immediately so please be patient.', "If there is a permit for three persons it's clearly stated in the advertisement and it is also clearly stated if students are allowed.", 'Only apply for those apartments.', 'Otherwise, there is no point in submitting an application.', 'Please be patient and we will get back to you as soon as possible.', 'This e-mail is to inform you that your contact person at your educational institution has not approved your registration for accommodation due to the following reason: Fully booked.', 'We have now reached a shortlist for the next stage and we’re sorry to have to let you know that we 
won’t be progressing with your application.', 'We really appreciate you applying for the role.', 'On this occasion, there were just some other candidates that more closely matched what we were looking for in this position.', 'Thanks again for your interest and please do keep an eye on our careers site for future roles with us.', 'Unfortunately, we will not be moving forward with your application, but we appreciate your time and interest in Confidential.', 'Please note that due to the volume of applications we receive we cannot contact everyone.', 'As this is an internship we are only looking for candidates who are currently enrolled at a university (and will remain enrolled throughout the entire internship).', "Based on your resume this doesn't seem to be the case, meaning that you are not eligible for this position.", 'As the vacancy stated, this is a strict requirement.', 'Please feel free to let me know if my assumption is wrong.']
# Store the sentence-tokenized form of the raw text `s`.
sentences=sent_tokenize(s)
# NOTE(review): `s` is a plain str, so FreqDist iterates it one character at a
# time — the summary printed below (63 samples, 8663 outcomes) is a character
# distribution, not a word distribution. If word frequencies were intended,
# FreqDist(word_tokenize(s)) would be the call — confirm intent before changing.
fdist1 = FreqDist(s)
print(fdist1)
<FreqDist with 63 samples and 8663 outcomes>
# Display the sentence list produced by sent_tokenize(s).
sentences