728x90
반응형
설치
!pip install konlpy
한나눔(Hannanum)
# Demo: morphological analysis of a Korean sentence with KoNLPy's Hannanum tagger.
from konlpy.tag import Hannanum

hannanum = Hannanum()

# The sample sentence must be a single, correctly encoded (UTF-8) string literal;
# the previous text was mis-decoded and split across two lines, which is a syntax error.
text = '안녕하세요! 오늘 많이 추워요'

print(hannanum.morphs(text))  # Parse phrase to morphemes
print(hannanum.nouns(text))  # Noun extractors
print(hannanum.pos(text))  # POS tagger
['안녕', '하', '세', '요', '!', '오늘', '많', '이', '춥', '어요']
['안녕', '오늘']
[('안녕', 'N'), ('하', 'X'), ('세', 'E'), ('요', 'J'), ('!', 'S'), ('오늘', 'N'), ('많', 'P'), ('이', 'X'), ('춥', 'P'), ('어요', 'E')]
꼬꼬마
# Demo: morphological analysis of a Korean sentence with KoNLPy's Kkma tagger.
from konlpy.tag import Kkma

kkma = Kkma()

# The sample sentence must be a single, correctly encoded (UTF-8) string literal;
# the previous text was mis-decoded and split across two lines, which is a syntax error.
text = '안녕하세요! 오늘은 많이 추워요'

print(kkma.morphs(text))  # Parse phrase to morphemes
print(kkma.nouns(text))  # Noun extractors
print(kkma.pos(text))  # POS tagger
['안녕', '하', '세요', '!', '오늘', '은', '많이', '춥', '어요']
['안녕', '오늘']
[('안녕', 'NNG'), ('하', 'XSV'), ('세요', 'EFN'), ('!', 'SF'), ('오늘', 'NNG'), ('은', 'JX'), ('많이', 'MAG'), ('춥', 'VA'), ('어요', 'EFN')]
Khaiii
# Build and install Khaiii from source using notebook shell commands.
# Fetch the Khaiii sources from GitHub.
!git clone https://github.com/kakao/khaiii.git
# Install CMake via pip; the configure step below invokes `cmake`.
!pip install cmake
# NOTE(review): `build` is created relative to the current directory, while the
# later steps use the absolute path /content/build and the sources are expected
# at /content/khaiii — this presumably assumes the notebook runs from /content
# (e.g. Google Colab); confirm before running elsewhere.
!mkdir build
# Configure the build tree against the cloned sources.
!cd build && cmake /content/khaiii
# Run the `all`, `resource`, `install` and `package_python` make targets in turn;
# every line repeats the `cd` into the build directory before calling make.
!cd /content/build/ && make all
!cd /content/build/ && make resource
!cd /content/build && make install
!cd /content/build && make package_python
# Install the generated Python package directory with pip.
!pip install /content/build/package_python
# Demo: tokenize a Korean sentence into morpheme surface forms with Khaiii.
from khaiii import KhaiiiApi

khaiiApi = KhaiiiApi()

# The sample sentence must be a correctly encoded (UTF-8) string literal.
tokenized = khaiiApi.analyze('코딩과 AI 개발이 둘다 가능한 사람은 많지 않다.')

tokens = []
for word in tokenized:
    # str(morph) is rendered as "<surface>/<tag>"; split on the LAST slash so a
    # surface form that itself contains '/' is not truncated to an empty string.
    tokens.extend(str(m).rsplit('/', 1)[0] for m in word.morphs)

print(tokens)
반응형
'자연어 처리 > Today I learned :' 카테고리의 다른 글
[자연어 처리] 맞춤법 전처리 교정 Py-Hanspell 예제 (0) | 2023.01.03 |
---|---|
[자연어 처리]전처리 띄어쓰기 교정 예제 PyKoSpacing 예제 (0) | 2023.01.03 |
[자연어 처리]한국어 전처리 re (0) | 2023.01.03 |
[자연어처리] 텍스트 전처리(Text Preprocessing) (1) | 2023.01.03 |
PYTORCH(파이토치) cheatsheet (0) | 2022.12.12 |