-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreferences.bib
138 lines (127 loc) · 9.09 KB
/
references.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
% Stefanowitsch (2011): chapter (pp. 257--289) in the edited volume
% "Cognitive Linguistics: Convergence and Expansion" (John Benjamins).
% The third editor's family name is the compound "Žic Fuchs", so it is given
% in "Last, First" form with both words before the comma.
@incollection{stefanowitsch_cognitive_2011,
  author    = {Stefanowitsch, Anatol},
  title     = {Cognitive linguistics meets the corpus},
  editor    = {Brdar, Mario and Gries, Stefan Th. and Žic Fuchs, Milena},
  booktitle = {Cognitive {Linguistics}: {Convergence} and {Expansion}},
  publisher = {John Benjamins Publishing Company},
  address   = {Amsterdam/Philadelphia},
  year      = {2011},
  pages     = {257--289}
}
% Rajeg (2021): version 0.0.1 of the material hosted at the GitHub URL below,
% with an OSF DOI. Only the words that must keep their capitals are braced in
% the title, and the month uses the standard macro like the other entries.
@manual{Rajeg_Constructional_equivalence_in_2021,
  author  = {Rajeg, Gede Primahadi Wijaya},
  title   = {Constructional equivalence in the {Indonesian} translations of {ROB} and {STEAL}},
  month   = dec,
  year    = {2021},
  version = {0.0.1},
  doi     = {10.17605/OSF.IO/PZC8Y},
  url     = {https://github.com/gederajeg/constructional-equivalence},
  license = {CC BY-NC-SA 4.0 International}
}
% Levshina (2015): textbook on statistical analysis of linguistic data with R
% (John Benjamins, Amsterdam).
@book{levshina_how_2015,
  author     = {Levshina, Natalia},
  title      = {How to do {Linguistics} with {R}: {Data} exploration and statistical analysis},
  shorttitle = {How to do {Linguistics} with {R}},
  publisher  = {John Benjamins Publishing Company},
  address    = {Amsterdam},
  month      = nov,
  year       = {2015},
  isbn       = {978-90-272-6845-7},
  language   = {en},
  keywords   = {Language Arts \& Disciplines / Linguistics / General, LANGUAGE ARTS \& DISCIPLINES / Linguistics / General, Computers / Natural Language Processing},
  abstract   = {This book provides a linguist with a statistical toolkit for exploration and analysis of linguistic data. It employs R, a free software environment for statistical computing, which is increasingly popular among linguists. How to do Linguistics with R: Data exploration and statistical analysis is unique in its scope, as it covers a wide range of classical and cutting-edge statistical methods, including different flavours of regression analysis and ANOVA, random forests and conditional inference trees, as well as specific linguistic approaches, among which are Behavioural Profiles, Vector Space Models and various measures of association between words and constructions. The statistical topics are presented comprehensively, but without too much technical detail, and illustrated with linguistic case studies that answer non-trivial research questions. The book also demonstrates how to visualize linguistic data with the help of attractive informative graphs, including the popular ggplot2 system and Google visualization tools.}
}
% Goldberg (1995): monograph on a construction grammar approach to argument
% structure (University of Chicago Press).
@book{goldberg_constructions_1995,
  author     = {Goldberg, Adele E.},
  title      = {Constructions: {A} construction grammar approach to argument structure},
  shorttitle = {Constructions},
  publisher  = {University of Chicago Press},
  address    = {Chicago},
  year       = {1995},
  isbn       = {978-0-226-30085-6 978-0-226-30086-3},
  keywords   = {Syntax, Semantics, Grammar, Comparative and general, construction grammar, Construction grammar, SEMANTICS}
}
% Tiedemann (2016): LREC'16 paper on alternative subtitle translations
% (pp. 3518--3522).
@inproceedings{tiedemann_finding_2016,
  author    = {Tiedemann, Jörg},
  title     = {Finding {Alternative} {Translations} in a {Large} {Corpus} of {Movie} {Subtitle}},
  booktitle = {Proceedings of the {Tenth} {International} {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'16)},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Portorož, Slovenia},
  month     = may,
  year      = {2016},
  pages     = {3518--3522},
  url       = {https://www.aclweb.org/anthology/L16-1559},
  urldate   = {2020-11-07},
  abstract  = {OpenSubtitles.org provides a large collection of user contributed subtitles in various languages for movies and TV programs. Subtitle translations are valuable resources for cross-lingual studies and machine translation research. A less explored feature of the collection is the inclusion of alternative translations, which can be very useful for training paraphrase systems or collecting multi-reference test suites for machine translation. However, differences in translation may also be due to misspellings, incomplete or corrupt data files, or wrongly aligned subtitles. This paper reports our efforts in recognising and classifying alternative subtitle translations with language independent techniques. We use time-based alignment with lexical re-synchronisation techniques and BLEU score filters and sort alternative translations into categories using edit distance metrics and heuristic rules. Our approach produces large numbers of sentence-aligned translation alternatives for over 50 languages provided via the OPUS corpus collection.},
  file      = {Tiedemann_2016_Finding Alternative Translations in a Large Corpus of Movie Subtitle.pdf:/Users/Primahadi/Documents/_Zotero Digital Library/Conference Paper/Tiedemann_2016_Finding Alternative Translations in a Large Corpus of Movie Subtitle.pdf:application/pdf},
}
% Tiedemann (2012): LREC'12 paper describing the OPUS parallel-corpus
% resource (pp. 2214--2218).
@inproceedings{tiedemann_parallel_2012,
  author    = {Tiedemann, Jörg},
  title     = {Parallel {Data}, {Tools} and {Interfaces} in {OPUS}},
  booktitle = {Proceedings of the {Eighth} {International} {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'12)},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Istanbul, Turkey},
  month     = may,
  year      = {2012},
  pages     = {2214--2218},
  url       = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/463_Paper.pdf},
  urldate   = {2021-11-07},
  abstract  = {This paper presents the current status of OPUS, a growing language resource of parallel corpora and related tools. The focus in OPUS is to provide freely available data sets in various formats together with basic annotation to be useful for applications in computational linguistics, translation studies and cross-linguistic corpus studies. In this paper, we report about new data sets and their features, additional annotation tools and models provided from the website and essential interfaces and on-line services included in the project.},
  file      = {Tiedemann_2012_Parallel Data, Tools and Interfaces in OPUS.pdf:/Users/Primahadi/Documents/_Zotero Digital Library/Conference Paper/Tiedemann_2012_Parallel Data, Tools and Interfaces in OPUS.pdf:application/pdf},
}
% Tiedemann (2016): EAMT 2016 Projects/Products paper on OPUS.
@inproceedings{tiedemann_opus_2016,
  author    = {Tiedemann, Jörg},
  title     = {{OPUS} – parallel corpora for everyone},
  booktitle = {Proceedings of the 19th {Annual} {Conference} of the {European} {Association} for {Machine} {Translation}: {Projects}/{Products}},
  publisher = {Baltic Journal of Modern Computing},
  address   = {Riga, Latvia},
  month     = may,
  year      = {2016},
  url       = {https://aclanthology.org/2016.eamt-2.8},
  urldate   = {2021-11-07},
  file      = {Tiedemann_2016_OPUS – parallel corpora for everyone.pdf:/Users/Primahadi/Documents/_Zotero Digital Library/Conference Paper/Tiedemann_2016_OPUS – parallel corpora for everyone.pdf:application/pdf},
}
% Lison and Tiedemann (2016): LREC'16 paper on the OpenSubtitles2016 parallel
% corpora (pp. 923--929).
% The corpus name and the acronym TV are braced so styles cannot lowercase them.
% The former "Publisher: ..." note duplicated the publisher field and is dropped.
% The month matches the other entry from the same LREC'16 proceedings.
@inproceedings{lison_opensubtitles2016_2016,
  author     = {Lison, Pierre and Tiedemann, Jörg},
  title      = {{OpenSubtitles2016}: {Extracting} large parallel corpora from movie and {TV} subtitles},
  shorttitle = {{OpenSubtitles2016}},
  booktitle  = {Proceedings of the {Tenth} {International} {Conference} on {Language} {Resources} and {Evaluation} ({LREC}'16)},
  publisher  = {European Language Resources Association (ELRA)},
  address    = {Portorož, Slovenia},
  month      = may,
  year       = {2016},
  pages      = {923--929},
  file       = {Lison_Tiedemann_2016_Opensubtitles2016.pdf:/Users/Primahadi/Documents/_Zotero Digital Library/Journal Article/Lison_Tiedemann_2016_Opensubtitles2016.pdf:application/pdf},
}
% Rajeg et al. (2021): OSF repository of data and code for the ROB/STEAL
% translation study. It is typed as misc rather than article because it has no
% journal; the host is given in howpublished for styles that ignore publisher
% on misc entries. The former "Publisher: OSF" note duplicated the publisher.
% NOTE(review): language set to "id" because title and abstract are
% Indonesian -- confirm this matches the toolchain's expected language codes.
@misc{rajeg_material_2021,
  author       = {Rajeg, Gede Primahadi Wijaya and Rajeg, I Made and Kartini, Putu Dea Indah and Putra, I Gede Semara Dharma},
  title        = {Material pendukung untuk \textit{{MODEL} {KAJIAN} {TERJEMAHAN} {BERBASIS} {BANK} {DATA} {TERJEMAHAN} {DIGITAL} {INGGRIS}-{INDONESIA} {DAN} {IMPLIKASI} {PEDAGOGISNYA}}},
  howpublished = {Open Science Framework},
  publisher    = {Open Science Framework},
  month        = nov,
  year         = {2021},
  doi          = {10.17605/OSF.IO/Y6ESA},
  url          = {https://osf.io/y6esa/},
  language     = {id},
  abstract     = {Repositori data dan kode pemrograman untuk Penelitian Unggulan Program Studi (PUPS) dengan judul MODEL KAJIAN TERJEMAHAN BERBASIS BANK DATA TERJEMAHAN DIGITAL INGGRIS-INDONESIA DAN IMPLIKASI PEDAGOGISNYA. Objek kajian yang menjadi fokus penelitian ini adalah verba sinonim bahasa Inggris ROB dan STEAL serta padanannya dalam bahasa Indonesia. Sumber data yang digunakan adalah korpus paralel (Bahasa Inggris - Bahasa Indonesia) bernama OpenSubtitles-v2018 (https://opus.nlpl.eu/OpenSubtitles-v2018.php).
Hosted on the Open Science Framework},
}
% Rajeg et al. (2021): paper on Indonesian equivalents of ROB and STEAL,
% with a figshare DOI and a GitHub URL.
@misc{rajeg_pemanfaatan_2021,
  author     = {Rajeg, Gede Primahadi Wijaya and Rajeg, I Made and Kartini, Putu Dea Indah and Putra, I Gede Semara Dharma},
  title      = {Pemanfaatan {Bank}-data {Digital} {Dwibahasa} dalam {Kajian} {Terjemahan}: {Studi} kasus padanan bahasa {Indonesia} untuk verba sinonim bahasa {Inggris} {ROB} \& {STEAL}},
  shorttitle = {Pemanfaatan {Bank}-data {Digital} {Dwibahasa} dalam {Kajian} {Terjemahan}},
  type       = {Paper},
  year       = {2021},
  doi        = {10.6084/m9.figshare.17078369},
  url        = {https://github.com/gederajeg/rob-steal-parallel-corpora},
  copyright  = {All rights reserved},
}
% Rajeg (2021): the paracorp R package, version 0.0.1.
% The author uses the same "Last, First" form as the other Rajeg entries, and
% the lowercase package name is braced so title-casing styles leave it alone.
@manual{rajeg_paracorp_2021,
  author    = {Rajeg, Gede Primahadi Wijaya},
  title     = {{paracorp}: A concordancer for parallel, bilingual corpora},
  publisher = {GitHub and Open Science Framework (OSF)},
  year      = {2021},
  note      = {R package version 0.0.1},
  doi       = {10.17605/OSF.IO/HV9CU},
  url       = {https://github.com/gederajeg/paracorp},
}