This is a PyTorch implementation of the pervasive attention model (paper on arXiv).
pip install tensorboardX h5py
cd data
./prepare-iwslt14.sh
cd ..
python preprocess.py -d iwslt14
mkdir -p save events
python train.py -c config/l24.yaml
python generate.py -c config/l24.yaml -b 5