From e6894584e36f8e4ffbfbb5f1bfa2fa41a224a84d Mon Sep 17 00:00:00 2001 From: Luis Date: Sat, 13 Jul 2019 15:57:07 -0400 Subject: [PATCH 1/5] add bibliography --- bibliography/README.md | 6 + bibliography/SIGMathLing.bib | 239 +++++++++++++++++++++++++++++++++++ 2 files changed, 245 insertions(+) create mode 100644 bibliography/README.md create mode 100644 bibliography/SIGMathLing.bib diff --git a/bibliography/README.md b/bibliography/README.md new file mode 100644 index 0000000..3b43b47 --- /dev/null +++ b/bibliography/README.md @@ -0,0 +1,6 @@ +## SIGMathLing Common Bibliography + +This is common bibliography for the SIGMathLing group. Topics of interest include: + +* Natural Language Processing/Computational Linguistics +* Mathematical Knowledge Management diff --git a/bibliography/SIGMathLing.bib b/bibliography/SIGMathLing.bib new file mode 100644 index 0000000..c82a4d4 --- /dev/null +++ b/bibliography/SIGMathLing.bib @@ -0,0 +1,239 @@ +@article{chen2017improving, + title={Improving sentiment analysis via sentence type classification using BiLSTM-CRF and CNN}, + author={Chen, Tao and Xu, Ruifeng and He, Yulan and Wang, Xuan}, + journal={Expert Systems with Applications}, + volume={72}, + pages={221--230}, + year={2017}, + publisher={Elsevier} +} + +@inproceedings{saggion, + title={Identifying Definitions in Text Collections for Question Answering.}, + author={Saggion, Horacio}, + booktitle={LREC}, + year={2004} +} + +@book{lange2011enabling, + title={Enabling collaboration on semiformal mathematical knowledge by semantic web integration}, + author={Lange, Christoph}, + volume={11}, + year={2011}, + publisher={IOS Press} +} + +@Article{Alama2014, +author="Alama, Jesse +and Heskes, Tom +and K{\"u}hlwein, Daniel +and Tsivtsivadze, Evgeni +and Urban, Josef", +title="Premise Selection for Mathematics by Corpus Analysis and Kernel Methods", +journal="Journal of Automated Reasoning", +year="2014", +month="Feb", +day="01", +volume="52", +number="2", +pages="191--213", +abstract="Smart premise selection is essential when using automated reasoning as a tool for large-theory formal proof development. This work develops learning-based premise selection in two ways. First, a fine-grained dependency analysis of existing high-level formal mathematical proofs is used to build a large knowledge base of proof dependencies, providing precise data for ATP-based re-verification and for training premise selection algorithms. Second, a new machine learning algorithm for premise selection based on kernel methods is proposed and implemented. To evaluate the impact of both techniques, a benchmark consisting of 2078 large-theory mathematical problems is constructed, extending the older MPTP Challenge benchmark. The combined effect of the techniques results in a 50 {\%} improvement on the benchmark over the state-of-the-art Vampire/SInE system for automated reasoning in large theories.", +issn="1573-0670", +doi="10.1007/s10817-013-9286-5", +url="https://doi.org/10.1007/s10817-013-9286-5" +} + + +@article{bengio2003neural, +title={A neural probabilistic language model}, +author={Bengio, Yoshua and Ducharme, R{\'e}jean and Vincent, Pascal and Jauvin, Christian}, +journal={Journal of machine learning research}, +volume={3}, + number={Feb}, + pages={1137--1155}, + year={2003} +} + +@InProceedings{bagof, +author = "Joulin, Armand +and Grave, Edouard +and Bojanowski, Piotr +and Mikolov, Tomas", +title = "Bag of Tricks for Efficient Text Classification", +booktitle = "Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 2, Short Papers", +year = "2017", +publisher = "Association for Computational Linguistics", +pages = "427--431", +location = "Valencia, Spain", +url = "http://aclweb.org/anthology/E17-2068" +} + +@article{pang2008opinion, + title={Opinion mining and sentiment analysis}, + author={Pang, Bo and Lee, Lillian and others}, + journal={Foundations and Trends{\textregistered} in Information Retrieval}, + volume={2}, + number={1--2}, + pages={1--135}, + year={2008}, + publisher={Now Publishers, Inc.} +} + +@article{bojanowski2017enriching, + title={Enriching Word Vectors with Subword Information}, + author={Bojanowski, Piotr and Grave, Edouard and Joulin, Armand and Mikolov, Tomas}, + journal={Transactions of the Association for Computational Linguistics}, + volume={5}, + year={2017}, + issn={2307-387X}, + pages={135--146} +} + +@inproceedings{murphy2003phrase, + title={Phrase detection and the associative memory neural network}, + author={Murphy, Richard C}, + booktitle={Proceedings of the International Joint Conference on Neural Networks, 2003.}, + volume={4}, + pages={2599--2603}, + year={2003}, + organization={IEEE} +} + +@article{cho2014learning, + title={Learning phrase representations using RNN encoder-decoder for statistical machine translation}, + author={Cho, Kyunghyun and Van Merri{\"e}nboer, Bart and Gulcehre, Caglar and Bahdanau, Dzmitry and Bougares, Fethi and Schwenk, Holger and Bengio, Yoshua}, + journal={arXiv preprint arXiv:1406.1078}, + year={2014} +} + +@inproceedings{huang2012improving, + title={Improving word representations via global context and multiple word prototypes}, + author={Huang, Eric H and Socher, Richard and Manning, Christopher D and Ng, Andrew Y}, + booktitle={Proceedings of the 50th Annual Meeting of the Association for Computational Linguistics: Long Papers-Volume 1}, + pages={873--882}, + year={2012}, + organization={Association for Computational Linguistics} +} + +@article{sunsimple, + title={A Simple Approach to Learn Polysemous Word Embeddings}, + author={Sun, Yifan and Rao, Nikhil and Ding, Weicong}, + journal={arXiv preprint arXiv:1707.01793}, + year={2017} +} + +@online{SML, + author = {Deyan Ginev}, + title = {arXMLiv:08.2018 dataset, an HTML5 conversion of arXiv.org}, + url = {https://sigmathling.kwarc.info/resources/arxmliv/}, + note = {SIGMathLing -- Special Interest Group on Math Linguistics}, + year = {2018}} + +@misc{fabs, + title = {Formal Abstracts}, + howpublished = {https://formalabstracts.github.io/}, + year = {2019}} + +@misc{webscipara, + author = {Deyan Ginev}, + title = {A Web Demo for Scientific Paragraph Classification }, + year = {2018}, + publisher = {GitHub}, + journal = {GitHub repository}, + howpublished = {\url{https://github.com/dginev/web-scipara-demo}}, + commit = {1937a1754c7376dc5f34292feaa2ff77115d2ca2} +} + +@article{transforming, + title={Transforming large collections of scientific publications to XML}, + author={Stamerjohanns, Heinrich and Kohlhase, Michael and Ginev, Deyan and David, Catalin and Miller, Bruce}, + journal={Mathematics in Computer Science}, + volume={3}, + number={3}, + pages={299--307}, + year={2010}, + publisher={Springer} +} + +@article{scikit-learn, + title={Scikit-learn: Machine Learning in {P}ython}, + author={Pedregosa, F. and Varoquaux, G. and Gramfort, A. and Michel, V. + and Thirion, B. and Grisel, O. and Blondel, M. and Prettenhofer, P. + and Weiss, R. and Dubourg, V. and Vanderplas, J. and Passos, A. and + Cournapeau, D. and Brucher, M. and Perrot, M. and Duchesnay, E.}, + journal={Journal of Machine Learning Research}, + volume={12}, + pages={2825--2830}, + year={2011} +} +@article{miller3latexml, + title={LaTeXML: A Latex to XML Converter. url: http://dlmf. nist. gov}, + author={Miller, Bruce}, + howpublished = {\url{https://dlmf.nist.gov/LaTeXML/}}, + year={2013}, + journal={LaTeXML/(visited on 03/12/2013)} +} + +@inproceedings{pennington2014glove, + title={Glove: Global vectors for word representation}, + author={Pennington, Jeffrey and Socher, Richard and Manning, Christopher}, + booktitle={Proceedings of the 2014 conference on empirical methods in natural language processing (EMNLP)}, + pages={1532--1543}, + year={2014} +} + + +@article{nersurvey, + title={A survey of named entity recognition and classification}, + author={Nadeau, David and Sekine, Satoshi}, + journal={Lingvisticae Investigationes}, + volume={30}, + number={1}, + pages={3--26}, + year={2007}, + publisher={John Benjamins} +} + +@article{nltk, + author = {Edward Loper and + Steven Bird}, + title = {{NLTK:} The Natural Language Toolkit}, + journal = {CoRR}, + volume = {cs.CL/0205028}, + year = {2002}, + url = {http://arxiv.org/abs/cs.CL/0205028}, + timestamp = {Mon, 13 Aug 2018 16:48:22 +0200}, + biburl = {https://dblp.org/rec/bib/journals/corr/cs-CL-0205028}, + bibsource = {dblp computer science bibliography, https://dblp.org} +} + +@inproceedings{domainAdaptation, + title={Instance weighting for domain adaptation in NLP}, + author={Jiang, Jing and Zhai, ChengXiang}, + booktitle={Proceedings of the 45th annual meeting of the association of computational linguistics}, + pages={264--271}, + year={2007} +} + +@article{DBLP:journals/corr/SchakelW15, + author = {Adriaan M. J. Schakel and + Benjamin J. Wilson}, + title = {Measuring Word Significance using Distributed Representations of Words}, + journal = {CoRR}, + volume = {abs/1508.02297}, + year = {2015}, + url = {http://arxiv.org/abs/1508.02297}, + archivePrefix = {arXiv}, + eprint = {1508.02297}, + timestamp = {Mon, 13 Aug 2018 16:47:39 +0200}, + biburl = {https://dblp.org/rec/bib/journals/corr/SchakelW15}, + bibsource = {dblp computer science bibliography, https://dblp.org} +} + +@article{article, +author = {Jiang, Jing}, +year = {2008}, +month = {01}, +pages = {}, +title = {Domain Adaptation in Natural Language Processing} +} -- GitLab From a7b048910730ef2c81de6baaa2c9a35ddca4e248 Mon Sep 17 00:00:00 2001 From: Luis Date: Sat, 13 Jul 2019 17:03:00 -0400 Subject: [PATCH 2/5] add nocite --- bibliography/Makefile | 11 +++++++++++ bibliography/README.md | 2 ++ bibliography/SIGMathLing.bib | 16 +--------------- bibliography/SIGMathLing.tex | 7 +++++++ 4 files changed, 21 insertions(+), 15 deletions(-) create mode 100644 bibliography/Makefile create mode 100644 bibliography/SIGMathLing.tex diff --git a/bibliography/Makefile b/bibliography/Makefile new file mode 100644 index 0000000..9d4b413 --- /dev/null +++ b/bibliography/Makefile @@ -0,0 +1,11 @@ +filename=SIGMathLing + +pdf: + pdflatex ${filename}.tex + bibtex ${filename}.aux + pdflatex ${filename}.tex + pdflatex ${filename}.tex + + +clean: + rm ${filename}.{pdf,log,aux,bbl,blg} diff --git a/bibliography/README.md b/bibliography/README.md index 3b43b47..130725a 100644 --- a/bibliography/README.md +++ b/bibliography/README.md @@ -4,3 +4,5 @@ This is common bibliography for the SIGMathLing group. Topics of interest includ * Natural Language Processing/Computational Linguistics * Mathematical Knowledge Management + + diff --git a/bibliography/SIGMathLing.bib b/bibliography/SIGMathLing.bib index c82a4d4..89c5aee 100644 --- a/bibliography/SIGMathLing.bib +++ b/bibliography/SIGMathLing.bib @@ -122,27 +122,12 @@ url = "http://aclweb.org/anthology/E17-2068" year={2017} } -@online{SML, - author = {Deyan Ginev}, - title = {arXMLiv:08.2018 dataset, an HTML5 conversion of arXiv.org}, - url = {https://sigmathling.kwarc.info/resources/arxmliv/}, - note = {SIGMathLing -- Special Interest Group on Math Linguistics}, - year = {2018}} @misc{fabs, title = {Formal Abstracts}, howpublished = {https://formalabstracts.github.io/}, year = {2019}} -@misc{webscipara, - author = {Deyan Ginev}, - title = {A Web Demo for Scientific Paragraph Classification }, - year = {2018}, - publisher = {GitHub}, - journal = {GitHub repository}, - howpublished = {\url{https://github.com/dginev/web-scipara-demo}}, - commit = {1937a1754c7376dc5f34292feaa2ff77115d2ca2} -} @article{transforming, title={Transforming large collections of scientific publications to XML}, @@ -237,3 +222,4 @@ month = {01}, pages = {}, title = {Domain Adaptation in Natural Language Processing} } + diff --git a/bibliography/SIGMathLing.tex b/bibliography/SIGMathLing.tex new file mode 100644 index 0000000..a52fb7a --- /dev/null +++ b/bibliography/SIGMathLing.tex @@ -0,0 +1,7 @@ +\documentclass{article} + +\begin{document} +\nocite{*} +\bibliographystyle{plain} +\bibliography{SIGMathLing} +\end{document} -- GitLab From e53988d3570e94d9d447383ad68efa67cf9ef3a1 Mon Sep 17 00:00:00 2001 From: Luis Date: Sun, 14 Jul 2019 07:10:44 -0400 Subject: [PATCH 3/5] add some comments and instructions --- bibliography/README.md | 5 +++++ bibliography/SIGMathLing.tex | 7 +++++++ 2 files changed, 12 insertions(+) diff --git a/bibliography/README.md b/bibliography/README.md index 130725a..9bc295b 100644 --- a/bibliography/README.md +++ b/bibliography/README.md @@ -4,5 +4,10 @@ This is common bibliography for the SIGMathLing group. Topics of interest includ * Natural Language Processing/Computational Linguistics * Mathematical Knowledge Management +* Please include any requests in the issues page. + +### Options for Makefile +* make -- creates a .pdf file with the nocite{*} option. +* make clean -- removes the latex processing files diff --git a/bibliography/SIGMathLing.tex b/bibliography/SIGMathLing.tex index a52fb7a..5d95daf 100644 --- a/bibliography/SIGMathLing.tex +++ b/bibliography/SIGMathLing.tex @@ -1,3 +1,10 @@ +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% +% +% SIGMathLing Bibliography +% Send any requests or additions to the Gitlab issues page +% +%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% + \documentclass{article} \begin{document} -- GitLab From 636abceba0bbf75e958de5515ed1baed359cc678 Mon Sep 17 00:00:00 2001 From: Luis Date: Mon, 15 Jul 2019 21:34:16 -0400 Subject: [PATCH 4/5] update .gitignore rule for latex accesory files --- .gitignore | 7 +++++++ 1 file changed, 7 insertions(+) diff --git a/.gitignore b/.gitignore index ed90730..8e7c009 100644 --- a/.gitignore +++ b/.gitignore @@ -1,2 +1,9 @@ _site Gemfile.lock + +# LaTeX files +bibliography/SIGMathLing.pdf +bibliography/SIGMathLing.log +bibliography/SIGMathLing.aux +bibliography/SIGMathLing.bbl +bibliography/SIGMathLing.blg -- GitLab From 07491f3a3fa3b7a0522405222e8f0d2ef1e14f86 Mon Sep 17 00:00:00 2001 From: Luis Date: Wed, 17 Jul 2019 15:17:54 -0400 Subject: [PATCH 5/5] change README to index.md --- bibliography/SIGMathLing.bib | 10 ++++++++++ bibliography/{README.md => index.md} | 0 2 files changed, 10 insertions(+) rename bibliography/{README.md => index.md} (100%) diff --git a/bibliography/SIGMathLing.bib b/bibliography/SIGMathLing.bib index 89c5aee..023d9ec 100644 --- a/bibliography/SIGMathLing.bib +++ b/bibliography/SIGMathLing.bib @@ -223,3 +223,13 @@ pages = {}, title = {Domain Adaptation in Natural Language Processing} } +@article{tshitoyan2019unsupervised, + title={Unsupervised word embeddings capture latent knowledge from materials science literature}, + author={Tshitoyan, Vahe and Dagdelen, John and Weston, Leigh and Dunn, Alexander and Rong, Ziqin and Kononova, Olga and Persson, Kristin A and Ceder, Gerbrand and Jain, Anubhav}, + journal={Nature}, + volume={571}, + number={7763}, + pages={95}, + year={2019}, + publisher={Nature Publishing Group} +} diff --git a/bibliography/README.md b/bibliography/index.md similarity index 100% rename from bibliography/README.md rename to bibliography/index.md -- GitLab