# Bring the base system fully up to date, then install the tools needed to
# fetch the project and run training.
sudo apt-get update
sudo apt-get upgrade -y
sudo apt-get dist-upgrade -y
sudo apt-get install -y python3 python3-pip screen git

# Register NVIDIA's CUDA apt repository for Ubuntu 18.04 (x86_64).
# The repository package and its signing key are fetched over HTTPS so they
# cannot be tampered with in transit.
CUDA_REPO_URL=https://developer.download.nvidia.com/compute/cuda/repos/ubuntu1804/x86_64
CUDA_REPO_PKG=cuda-repo-ubuntu1804_10.0.130-1_amd64.deb
wget -O "/tmp/${CUDA_REPO_PKG}" "${CUDA_REPO_URL}/${CUDA_REPO_PKG}"
sudo dpkg -i "/tmp/${CUDA_REPO_PKG}"
# NOTE(review): verify that 7fa2af80 is still the current signing key for this
# repository before relying on it.
sudo apt-key adv --fetch-keys "${CUDA_REPO_URL}/7fa2af80.pub"
rm -f "/tmp/${CUDA_REPO_PKG}"

# Refresh the index so the newly registered repository is visible, then
# install the driver. -y keeps this step non-interactive like the ones above.
sudo apt-get update
sudo apt-get install -y cuda-drivers
# Fetch the project and install its Python dependencies.
# The steps are chained with && so that a failed clone or cd can never let
# pip3 pick up a requirements.txt from the wrong directory.
git clone https://github.com/hexvalid/ai-bdc &&
  cd ai-bdc &&
  pip3 install -r requirements.txt
# Run main.py in train mode with the settings shared by every run below.
#   $1   - learning rate (passed to --lr)
#   $2   - number of epochs (passed to --epoch)
#   $3.. - extra flags, appended unchanged after --epoch
train_run() {
  local lr=$1
  local epochs=$2
  shift 2
  python3 main.py --mode train --cuda True --lr "$lr" --workers 16 --batch-size 128 --epoch "$epochs" "$@"
}

train_run 0.0001 30
train_run 0.0001 50 --warm-up True
train_run 0.00002 10
- Train for 30 epochs at a learning rate of 1e-4 for warm-up
- Train for about 10 epochs at a learning rate of 2e-5 for fine-tuning
- Deploy a DigitalOcean CPU-optimized Debian 9 droplet
- Convert the droplet to Arch Linux using this script: https://github.com/gh2o/digitalocean-debian-to-arch
- Install dependencies:
# Install the packages used by the steps that follow (screen, Go, PHP and
# the image/font libraries).
pacman -S screen bash-completion go php php-cgi php-gd libjpeg libpng fontconfig
# Fetch the project and the Go progress-bar package.
git clone https://github.com/hexvalid/ai-bdc
go get github.com/cheggaaa/pb/v3
# Enter the generator directory and create its output and scratch
# directories. mkdir is chained to cd so "out" is never created in the wrong
# place, and -p makes the step safe to repeat when the directories exist.
cd ai-bdc/gen && mkdir -p out /tmp/bdc_void/
- Change style (optional):
# Edit the $STYLE= assignment in the file opened below.
# A value of -1 means random.
nano php/botdetect-captcha-lib/botdetect/CaptchaIncludes.php
- Prepare PHP-CGI:
# Start 10 PHP servers (php -S, the built-in web server) on
# 127.0.0.1:9000 through 127.0.0.1:9009. Each one runs in its own detached
# screen session named php-<port>, because php -S stays in the foreground.
# Reattach to a server with: screen -r php-<port>
for port in {9000..9009}; do
  screen -dmS "php-${port}" php -c php/php.ini -t php/ -S "127.0.0.1:${port}"
done
- Run Generation Script:
# Open gen.go and check the mode and count settings before each run.
# The generator has to be run twice: once with mode = 1 and once with
# mode = 2.
nano gen.go
# Run this inside a screen session.
go run gen.go
- Package:
# Pack the out/ directory into an xz-compressed tar archive.
tar --create --xz --file=gendata-count250k-style18.tar.xz out/
- Clean:
# Reset the scratch state: recreate /tmp/bdc_pipe as an empty file and
# /tmp/bdc_void/ as an empty directory.
# rm -f is used so that a missing /tmp/bdc_pipe (e.g. on a first run) does
# not fail and short-circuit the rest of the && chain.
rm -f /tmp/bdc_pipe && touch /tmp/bdc_pipe && rm -rf /tmp/bdc_void/ && mkdir /tmp/bdc_void/
- Publish:
# Install the github-release command-line tool.
# NOTE(review): newer Go releases install binaries with
# `go install <pkg>@latest` rather than `go get` — confirm against the Go
# version on the host.
go get github.com/github-release/github-release
# Replace "..." with a GitHub token that is allowed to upload release assets.
export GITHUB_TOKEN=...
# The binary is located through `go env GOPATH` instead of the relative path
# go/bin/, so the upload works from the directory that holds the archive
# rather than only from the directory containing go/.
"$(go env GOPATH)/bin/github-release" upload --user hexvalid --repo ai-bdc --tag gendatas --name "gendata-count250k-style18.tar.xz" --file gendata-count250k-style18.tar.xz