|
Bajardi: Axatov Asadbek
|
Sana | 13.03.2024 | Hajmi | 113.67 Kb. | | #170399 |
Bog'liq akbar1 signal1amaliAAA, diyor, Bekzod, jahpnd, KOMPAMALIYOT3, signallar, 8-9-19 asadmt, Data Storage. Preferences. SharedPreferences (1), 2-Mavzu Ma’lumot bazasining arxitekturasi va uch bosqichli arxi, azi, doston2, doston4, doston5FINISH, doston1, doston3
O’ZBEKISTON RESPUBLIKASI AXBOROT TEXNOLOGIYALARI VA KOMMUNIKATSIYALARINI RIVOJLANTIRISH VAZIRLIGI MUHAMMAD AL-XORAZMIY NOMIDAGI TOSHKENT AXBOROT TEXNOLOGIYALARI UNIVERSITETI
Axatov Asadbekning “Tabiiy tilni qayta ishlash” fanidan “Matnni avtomatik qayta ishlash sistemasi modullarini yaratish” mavzusida tayyorlagan 1-laboratoriya ishi
Bajardi: Axatov Asadbek
Tekshirdi: Abjalova Manzura
1-LABORATORIYA ISHI
Ishni bajarish tartibi
KOD:
from csv import writer
from urllib.parse import urljoin

import requests
from bs4 import BeautifulSoup
# Read the text to check from the user; it is lower-cased once here because
# the later lookups compare it against lower-cased text.
soz = input("So'zni kiriting:").lower()
def _split_punctuation(word):
    """Split *word* into (leading, core, trailing) around its alphanumeric core.

    ``leading`` and ``trailing`` hold the non-alphanumeric characters at the
    two ends of the token; characters inside the core (such as the apostrophe
    in "o'zmu") are left untouched.
    """
    start, end = 0, len(word)
    while start < end and not word[start].isalnum():
        start += 1
    while end > start and not word[end - 1].isalnum():
        end -= 1
    return word[:start], word[start:end], word[end:]


def expand_shortcuts(sentence, shortcuts_dict):
    """Replace known abbreviations in *sentence* with their canonical spelling.

    The sentence is split on whitespace and every token is looked up in
    *shortcuts_dict* case-insensitively.  A token that is not found as-is is
    looked up again without its leading/trailing non-alphanumeric characters,
    so abbreviations that touch punctuation ("aqsh," or "(bmt)") are expanded
    as well; the punctuation itself is kept in the output.

    Args:
        sentence: Text to process.
        shortcuts_dict: Mapping from lower-case abbreviation to the spelling
            that should replace it.

    Returns:
        A ``(text, changed_words)`` tuple.  ``text`` is the processed tokens
        joined with single spaces.  ``changed_words`` maps every token that
        was altered (without surrounding punctuation) to its replacement;
        tokens already in canonical form are not listed.
    """
    expanded_sentence = []
    changed_words = {}
    for word in sentence.split():
        prefix, core, suffix = "", word, ""
        # Prefer an exact match on the whole token; only when that fails try
        # the token with its surrounding punctuation peeled off.
        if word.lower() not in shortcuts_dict:
            prefix, core, suffix = _split_punctuation(word)
        expanded_core = shortcuts_dict.get(core.lower(), core)
        if expanded_core != core:
            changed_words[core] = expanded_core
        expanded_sentence.append(prefix + expanded_core + suffix)
    return " ".join(expanded_sentence), changed_words
# Lower-case abbreviation -> canonical spelling. Keys are lower-case because
# expand_shortcuts lower-cases each word before looking it up here.
shortcuts_dict = {
    "asad": "ASAD",
    "baa": "BAA",
    "rc": "RC",
    "kxdr": "KXDR",
    "hp": "HP",
    "unicef": "UNICEF",
    "dxx": "DXX",
    "buxdu": "BuxDU",
    "bmt": "BMT",
    "aqsh": "AQSH",
    "iiv": "IIV",
    "xtb": "XTB",
    "xdp": "XDP",
    "dtm": "DTM",
    "tatu": "TATU",
    "xxr": "XXR",
    "toshdiu": "ToshDIU",
    "mchj": "MCHJ",
    "yunesko": "YUNESKO",
    "it": "IT",
    "o'zmu": "O`zMU",
    "o'zas": "O`zAS",
    "ayoqsh": "AYOQSH",
    "yaim": "YaIM",
    "fish": "FISH",
    "mdh": "MDH",
    "duk": "DUK",
    "rf": "RF",
}
# Expand the abbreviations in the entered text, show the resulting sentence,
# then list every word that was rewritten next to its replacement.
expanded_sentence, changed = expand_shortcuts(soz.lower(), shortcuts_dict)
print("Natija : ", expanded_sentence)
for original_word in changed:
    print(f"{original_word} -> {changed[original_word]}")
# Look the entered word up in recent kun.uz articles: fetch the category
# listing, open each linked article in turn and stop at the first one whose
# paragraphs (<p>) or sub-headings (<h4>) contain the word.
request_timeout = 10  # seconds; requests.get waits indefinitely by default
query = soz.strip().lower()
topildimi = 'No'
jobs = []
m = 0
# An empty query is a substring of every text and would "match" the first
# article, so the search is skipped entirely in that case.
if query:
    html_text = requests.get(
        'https://kun.uz/uz/news/category/uzbekiston', timeout=request_timeout
    ).text
    soup = BeautifulSoup(html_text, 'lxml')
    jobs = soup.find_all('div', class_='col-md-4 mb-25 l-item')
for m, job in enumerate(jobs, start=1):
    print(m)  # progress: ordinal of the listing card being checked
    anchor = job.find('a', class_='news__title')
    if anchor is None or not anchor.get('href'):
        continue  # listing card without a usable article link
    # urljoin handles root-relative, relative and absolute hrefs alike.
    link = urljoin('https://kun.uz/', anchor['href'])
    try:
        response = requests.get(link, timeout=request_timeout)
        response.raise_for_status()
    except requests.RequestException:
        continue  # one unreachable article should not abort the whole search
    soup_0 = BeautifulSoup(response.text, 'lxml')
    content = soup_0.find('div', class_='single-content')
    if content is None:
        continue  # page has no 'single-content' container to search in
    # Join with newlines so the last word of one element is not glued to the
    # first word of the next, which could produce false substring matches.
    title = '\n'.join(tag.text for tag in content.find_all('p'))
    tezis = '\n'.join(tag.text for tag in content.find_all('h4'))
    found_in_body = query in title.lower()
    if found_in_body or query in tezis.lower():
        print("\nSo'z to'g'ri yozilgan\n")
        # NOTE(review): the first branch used to print a fixed string with no
        # placeholder; the paragraph text is assumed to be what was intended,
        # mirroring the sub-heading branch. Confirm with the author.
        print(f"So'z qatnashgan maqola:\n{title if found_in_body else tezis} ")
        topildimi = 'yes'
        break
if topildimi != 'yes':
    print("Siz kiritgan so'z topilmadi. Kiritgan so'zingiz to'g'ri bo'lmasligi mumkin. Tekshirib ko'ring")
Natija:
Dastur so’zlarni avvalo bazadan, u yerda bo’lmasa, kun.uz rasmiy saytidan qidiradi!
|
| |