Paraphrase

Funpedia

Extracted from the ParlAI Funpedia task, https://github.com/facebookresearch/ParlAI/tree/master/parlai/tasks/funpedia

Original paper, https://arxiv.org/abs/1705.06476

Citation

@misc{miller2018parlai,
  author        = {Miller, Alexander H. and Feng, Will and Fisch, Adam and Lu, Jiasen and Batra, Dhruv and Bordes, Antoine and Parikh, Devi and Weston, Jason},
  title         = {{ParlAI}: A Dialog Research Software Platform},
  year          = {2018},
  eprint        = {1705.06476},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}

MSCOCO

Extracted from MS COCO Captions using the tensor2tensor data generator, https://github.com/tensorflow/tensor2tensor/blob/master/tensor2tensor/data_generators/paraphrase_ms_coco.py

Original paper, http://arxiv.org/abs/1405.0312

Citation

@article{DBLP:journals/corr/LinMBHPRDZ14,
  author        = {Tsung{-}Yi Lin and
                   Michael Maire and
                   Serge J. Belongie and
                   Lubomir D. Bourdev and
                   Ross B. Girshick and
                   James Hays and
                   Pietro Perona and
                   Deva Ramanan and
                   Piotr Doll{\'{a}}r and
                   C. Lawrence Zitnick},
  title         = {Microsoft {COCO:} Common Objects in Context},
  journal       = {CoRR},
  volume        = {abs/1405.0312},
  year          = {2014},
  url           = {http://arxiv.org/abs/1405.0312},
  archivePrefix = {arXiv},
  eprint        = {1405.0312},
  timestamp     = {Mon, 13 Aug 2018 16:48:13 +0200},
  biburl        = {https://dblp.org/rec/journals/corr/LinMBHPRDZ14.bib},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}

PAWS

Original website, https://github.com/google-research-datasets/paws

Original paper, https://arxiv.org/abs/1904.01130

Citation

@misc{zhang2019paws,
  author        = {Zhang, Yuan and Baldridge, Jason and He, Luheng},
  title         = {{PAWS}: Paraphrase Adversaries from Word Scrambling},
  year          = {2019},
  eprint        = {1904.01130},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}

Semisupervised Academia.edu

Generated by paraphrasing the Academia PDF corpus (https://github.com/huseinzol05/Malay-Dataset#academia-pdf) with the Malaya T5-Base Paraphrase model.

Citation

@misc{Malay-Dataset-semisupervised-academia,
  author       = {Husein, Zolkepli},
  title        = {{Malay-Dataset}},
  year         = {2018},
  publisher    = {GitHub},
  journal      = {GitHub repository},
  howpublished = {\url{https://github.com/huseinzol05/malay-dataset/tree/master/paraphrase/semisupervised-academia}},
  note         = {We gather Bahasa Malaysia corpus! Semisupervised Academia.edu Paraphrases using T5-Bahasa}
}

Semisupervised News

Generated by paraphrasing the crawled news corpus (https://github.com/huseinzol05/Malay-Dataset#crawled-news) with the Malaya T5-Base Paraphrase model.

Citation

@misc{Malay-Dataset-semisupervised-news,
  author       = {Husein, Zolkepli},
  title        = {{Malay-Dataset}},
  year         = {2018},
  publisher    = {GitHub},
  journal      = {GitHub repository},
  howpublished = {\url{https://github.com/huseinzol05/malay-dataset/tree/master/paraphrase/semisupervised-academia}},
  note         = {We gather Bahasa Malaysia corpus! Semisupervised Bahasa News Paraphrases using T5-Bahasa},
  review-note  = {TODO confirm: howpublished points at the semisupervised-academia directory although this entry describes the news paraphrases}
}

Semisupervised Wikipedia

Generated by paraphrasing the Wikipedia corpus (https://github.com/huseinzol05/Malay-Dataset#wikipedia) with the Malaya T5-Base Paraphrase model.

Citation

@misc{Malay-Dataset-semisupervised-wikipedia,
  author       = {Husein, Zolkepli},
  title        = {{Malay-Dataset}},
  year         = {2018},
  publisher    = {GitHub},
  journal      = {GitHub repository},
  howpublished = {\url{https://github.com/huseinzol05/malay-dataset/tree/master/paraphrase/semisupervised-academia}},
  note         = {We gather Bahasa Malaysia corpus! Semisupervised Bahasa Wikipedia Paraphrases using T5-Bahasa},
  review-note  = {TODO confirm: howpublished points at the semisupervised-academia directory although this entry describes the Wikipedia paraphrases}
}