- create and activate a conda environment with Python 3.10
conda create -n clipgrasp python=3.10
conda activate clipgrasp
- install PyTorch 1.13.0, torchvision 0.14.0, and torchaudio 0.13.0 built for CUDA 11.7 (or any other mutually compatible PyTorch/CUDA combination)
conda install pytorch==1.13.0 torchvision==0.14.0 torchaudio==0.13.0 pytorch-cuda=11.7 -c pytorch -c nvidia
- install the required packages listed in requirements.txt
pip install -r requirements.txt
- run the demo with a natural-language text query
python demo.py --text_query "Can you give me something to drink?"