# Refresh the package index, then install the base tooling: a JDK, Python
# packaging/venv support, git, and the curl and wget downloaders.
# wget is listed explicitly because the IDE download step invokes it and it is
# not guaranteed to be present on a minimal installation.
sudo apt update
sudo apt install -y openjdk-17-jdk python3-pip python3-venv git curl wget
# Download IntelliJ IDEA Community Edition (free).
wget https://download.jetbrains.com/idea/ideaIC-2023.2.tar.gz -O idea.tar.gz
# Unpack directly into /opt/idea.
# --strip-components=1 drops the archive's versioned top-level directory, so
# no glob-based rename is needed and re-running this step does not nest a
# second copy inside an already existing /opt/idea.
sudo mkdir -p /opt/idea
sudo tar -xzf idea.tar.gz -C /opt/idea --strip-components=1
# Create a desktop launcher for IntelliJ IDEA.
# The per-user applications directory may not exist yet on a fresh account;
# create it first so the redirection below cannot fail.
mkdir -p ~/.local/share/applications
# Quoted heredoc delimiter: the entry is written literally, with no expansion.
cat > ~/.local/share/applications/idea.desktop <<'EOF'
[Desktop Entry]
Name=IntelliJ IDEA
Type=Application
Exec=/opt/idea/bin/idea.sh
Terminal=false
Icon=/opt/idea/bin/idea.png
Comment=IntelliJ IDEA
NoDisplay=false
Categories=Development;IDE;
EOF
chmod +x ~/.local/share/applications/idea.desktop
# Create the project directory (-p: no error if it already exists) and enter
# it. Abort if the directory cannot be entered, so the virtual environment is
# never created in whatever directory happened to be current.
mkdir -p ~/nlp_projects
cd ~/nlp_projects || exit 1

# Create and activate a dedicated virtual environment named nlp_env.
python3 -m venv nlp_env
source nlp_env/bin/activate

# Upgrade pip through the interpreter so the running pip executable is not
# replacing itself.
python -m pip install --upgrade pip

# Data handling and plotting.
pip install numpy pandas matplotlib seaborn
# Jupyter notebook tooling.
pip install jupyter notebook ipykernel
# Classic NLP and machine-learning libraries.
pip install nltk spacy gensim scikit-learn
# PyTorch (default build).
pip install torch torchvision torchaudio
# Hugging Face libraries and the SentencePiece tokenizer.
pip install transformers datasets sentencepiece

# Download every NLTK data package and the small English spaCy pipeline.
python -m nltk.downloader all
python -m spacy download en_core_web_sm
项目位置: ~/nlp_projects
虚拟环境名称: nlp_env
Python 解释器路径: ~/nlp_projects/nlp_env/bin/python3
# Install the Hugging Face transformers library.
pip install transformers
# Log in to Hugging Face.
huggingface-cli login # Enter your Hugging Face account token when prompted
# Install the CUDA toolkit (Ubuntu example).
sudo apt install -y nvidia-cuda-toolkit
# Verify the installation.
nvcc --version
# Install the GPU build of PyTorch (choose the index URL that matches your
# CUDA version).
# pip treats an already installed torch as satisfying the requirement and
# would skip the install, so remove any existing build first. Uninstalling a
# package that is not installed only prints a warning.
pip uninstall -y torch torchvision torchaudio
pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu118
PYTHONPATH=<项目根目录>(请将占位符替换为实际的项目根目录路径,例如 ~/nlp_projects)
创建常用 NLP 代码模板:(1) 打开 Settings > Editor > Live Templates;(2) 添加 Python 组;(3) 创建如 "nlp-load-text"、"nlp-tokenize" 等模板。
创建测试文件 test_nlp.py:
# Smoke test for the NLP environment: runs NLTK word tokenization and a
# Hugging Face Transformers sentiment-analysis pipeline, printing both results.
import nltk
from transformers import pipeline

# NLTK check: split a short sentence into word tokens.
tokens = nltk.word_tokenize("Hello NLP world!")
print("NLTK 测试:", tokens)

# Transformers check: build a sentiment-analysis pipeline and classify one sentence.
classifier = pipeline("sentiment-analysis")
sentiment = classifier("I love using IntelliJ IDEA for NLP projects!")
print("情感分析:", sentiment)
运行成功即表示基本 NLP 环境配置完成。