-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathvrosenberg1853.bib
161 lines (145 loc) · 8.94 KB
/
vrosenberg1853.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
% Journal article (1853) on the Mentawai Islands and their inhabitants (Dutch title).
% The name particle is written lower-case so that BibTeX parses "von" as the
% von-part (family name "Rosenberg") instead of folding it into the last name.
% The citation key is deliberately left unchanged so existing citations still resolve.
@article{VonRosenberg1853,
  author  = {von Rosenberg, Hermann},
  title   = {De {{Mentawei-Eilanden}} En {{Hunne Bewoners}}},
  journal = {Tijdschrift voor Indische Taal-, Land- en Volkenkunde},
  year    = {1853},
  volume  = {1},
  pages   = {403--440},
  url     = {https://www.digitale-sammlungen.de/en/view/bsb10433845?page=450,451}
}
% Journal article introducing the Cross-Linguistic Data Formats (CLDF) specification.
% "pages" holds the article number used by Scientific Data.
% The reference manager's machine-local "file" attachment path is intentionally
% omitted: it is not portable and exposes a private directory layout.
@article{forkel_cross-linguistic_2018,
  author    = {Forkel, Robert and List, Johann-Mattis and Greenhill, Simon J. and Rzymski, Christoph and Bank, Sebastian and Cysouw, Michael and Hammarstr{\"o}m, Harald and Haspelmath, Martin and Kaiping, Gereon A. and Gray, Russell D.},
  title     = {Cross-{{Linguistic Data Formats}}, Advancing Data Sharing and Re-Use in Comparative Linguistics},
  journal   = {Scientific Data},
  year      = {2018},
  month     = oct,
  volume    = {5},
  number    = {1},
  pages     = {180205},
  publisher = {Nature Publishing Group},
  issn      = {2052-4463},
  doi       = {10.1038/sdata.2018.205},
  urldate   = {2023-01-18},
  abstract  = {The amount of available digital data for the languages of the world is constantly increasing. Unfortunately, most of the digital data are provided in a large variety of formats and therefore not amenable for comparison and re-use. The Cross-Linguistic Data Formats initiative proposes new standards for two basic types of data in historical and typological language comparison (word lists, structural datasets) and a framework to incorporate more data types (e.g. parallel texts, and dictionaries). The new specification for cross-linguistic data formats comes along with a software package for validation and manipulation, a basic ontology which links to more general frameworks, and usage examples of best practices.},
  copyright = {2018 The Author(s)},
  langid    = {english},
  keywords  = {cross-linguistic data format,cross-linguistic lexical database,Databases,Interdisciplinary studies,lexical database,Social anthropology}
}
% Conference paper presenting the cldfbench framework (LREC 2020 proceedings).
@inproceedings{forkel_cldfbench_2020,
  author     = {Forkel, Robert and List, Johann-Mattis},
  title      = {{{CLDFBench}}: {{Give Your Cross-Linguistic Data}} a {{Lift}}},
  shorttitle = {{{CLDFBench}}},
  booktitle  = {Proceedings of the {{Twelfth Language Resources}} and {{Evaluation Conference}}},
  year       = {2020},
  month      = may,
  pages      = {6995--7002},
  publisher  = {European Language Resources Association},
  address    = {Marseille, France},
  isbn       = {979-10-95546-34-4},
  url        = {https://aclanthology.org/2020.lrec-1.864},
  urldate    = {2023-06-07},
  langid     = {english},
  abstract   = {While the amount of cross-linguistic data is constantly increasing, most datasets produced today and in the past cannot be considered FAIR (findable, accessible, interoperable, and reproducible). To remedy this and to increase the comparability of cross-linguistic resources, it is not enough to set up standards and best practices for data to be collected in the future. We also need consistent workflows for the ``retro-standardization'' of data that has been published during the past decades and centuries. With the Cross-Linguistic Data Formats initiative, first standards for cross-linguistic data have been presented and successfully tested. So far, however, CLDF creation was hampered by the fact that it required a considerable degree of computational proficiency. With cldfbench, we introduce a framework for the retro-standardization of legacy data and the curation of new datasets that drastically simplifies the creation of CLDF by providing a consistent, reproducible workflow that rigorously supports version control and long term archiving of research data and code. The framework is distributed in form of a Python package along with usage information and examples for best practice. This study introduces the new framework and illustrates how it can be applied by showing how a resource containing structural and lexical data for Sinitic languages can be efficiently retro-standardized and analyzed.}
}
% Software reference for the cldfbench Python library; url is the GitHub repository.
@misc{forkel_cldfbench_2023,
  author     = {Forkel, Robert},
  title      = {cldfbench: {{Python}} Library Implementing a {{CLDF}} Workbench},
  shorttitle = {Cldfbench},
  year       = {2023},
  month      = sep,
  url        = {https://github.com/cldf/cldfbench},
  urldate    = {2024-07-05},
  copyright  = {Apache Software License}
}
% Software reference for the pyconcepticon Python package.
% A url is supplied so that the existing urldate has something to refer to and the
% entry can be located; it follows the sibling cldfbench entry in pointing at the
% project's source repository.
@misc{forkel_pyconcepticon_2022,
  author     = {Forkel, Robert},
  title      = {Pyconcepticon: Programmatic Curation of Concepticon-Data},
  shorttitle = {Pyconcepticon},
  year       = {2022},
  month      = nov,
  url        = {https://github.com/concepticon/pyconcepticon},
  urldate    = {2023-06-02},
  copyright  = {Apache Software License},
  keywords   = {data,linguistics}
}
% Software reference for the deeplr R package (DeepL API wrapper); url is the CRAN page.
@misc{zumbach_deeplr_2023,
  author     = {Zumbach, David and Bauer, Paul C.},
  title      = {Deeplr: {{Interface}} to the '{{DeepL}}' {{Translation API}}},
  shorttitle = {Deeplr},
  year       = {2023},
  month      = nov,
  url        = {https://cran.r-project.org/package=deeplr},
  urldate    = {2024-07-05},
  copyright  = {MIT + file LICENSE},
  abstract   = {A wrapper for the 'DeepL' Pro API {$<$}https://www.deepl.com/docs-api{$>$}, a web service for translating texts between different languages. A DeepL API developer account is required to use the service (see {$<$}https://www.deepl.com/pro\#developer{$>$}).}
}
% Post in "Computer-Assisted Language Comparison in Practice" on adding concept
% lists to Concepticon.
% type and issn are given so this entry matches the other entries in this file
% that cite the same journal; the stray non-breaking-space tie that preceded
% "(List et al., 2019)" in the abstract has been removed.
@misc{tjuka_adding_2020,
  type       = {Billet},
  author     = {Tjuka, Annika},
  title      = {Adding Concept Lists to {{Concepticon}}: {{A}} Guide for Beginners},
  shorttitle = {Adding Concept Lists to {{Concepticon}}},
  year       = {2020},
  month      = jan,
  journal    = {Computer-Assisted Language Comparison in Practice},
  issn       = {2629-5873},
  doi        = {10.58079/m6kj},
  urldate    = {2023-06-02},
  abstract   = {Scientific data should be openly accessible. This includes databases which are designed for collaborative work. However, in most cases, these databases are only extended by a team of experts. If a database is truly collaborative, the workflows need to be accessible for everybody. The Concepticon database (List et al., 2019) invites contributors to include their [{\dots}]},
  langid     = {american}
}
% Book on orthography profiles; number 10 in the named Language Science Press series.
@book{moran_unicode_2018,
  author    = {Moran, Steven and Cysouw, Michael},
  title     = {The {{Unicode}} Cookbook for Linguists: {{Managing}} Writing Systems Using Orthography Profiles},
  year      = {2018},
  series    = {Translation and {{Multilingual Natural Language Processing}}},
  number    = {10},
  publisher = {Language Science Press},
  address   = {Berlin},
  doi       = {10.5281/zenodo.1296780}
}
% Post (type "Billet") in "Computer-Assisted Language Comparison in Practice"
% about converting a Vietic dataset to CLDF.
@misc{list_converting_2021,
  type     = {Billet},
  author   = {List, Johann-Mattis},
  title    = {Converting the {{Vietic Dataset}} by {{Sidwell}} and {{Alwes}} from 2021 to {{CLDF}}},
  year     = {2021},
  month    = sep,
  journal  = {Computer-Assisted Language Comparison in Practice},
  issn     = {2629-5873},
  doi      = {10.58079/m6la},
  urldate  = {2024-07-05},
  abstract = {A few days ago, Sidwell and Alwes submitted a very nice dataset on Vietic languages to Zenodo (10.5281/zenodo.5263194). When inspecting the data, I realized that this dataset could be easily converted to our CLDF formats in our new Lexibank standards. Since both authors explicitly invited for discussions of the data and the testing of the [{\dots}]},
  langid   = {american}
}
% Post (type "Billet") in "Computer-Assisted Language Comparison in Practice"
% about converting a Gothic dictionary to a CLDF wordlist on Windows.
@misc{martinovic_converting_2022,
  type     = {Billet},
  author   = {Martinovi{\'c}, Viktor},
  title    = {Converting {{Streitberg}}'s {{Gothic Dictionary}} to a {{CLDF Wordlist}} on a {{Windows System}}},
  year     = {2022},
  month    = feb,
  journal  = {Computer-Assisted Language Comparison in Practice},
  issn     = {2629-5873},
  doi      = {10.58079/m6lg},
  urldate  = {2024-07-05},
  abstract = {I recently converted the Gothic dictionary written by Wilhelm Streitberg to a CLDF wordlist. Since I was using Windows, I had some difficulties during the conversion progress, which Unix system users may not have to deal with. I thought it would be useful to share my experience here and point out that users of Windows [{\dots}]},
  langid   = {american}
}
% CLDF dataset published on Zenodo, derived from the Tomoip wordlist.
% The quoted source title uses TeX opening/closing quotes (``...'') instead of
% straight double quotes, which typeset as two closing quotes and are an active
% shorthand character under some babel languages.
@misc{barlow_cldf_2023,
  author    = {Barlow, Russell and Killian, Don},
  title     = {{{CLDF}} Dataset Derived from {{Barlow}} and {{Killian}}'s ``{{Tomoip Wordlist}}'' from 2023},
  year      = {2023},
  month     = oct,
  publisher = {Zenodo},
  doi       = {10.5281/zenodo.8437515},
  urldate   = {2024-07-05},
  abstract  = {Cite the source of the dataset as: Barlow, Russell \& Killian, Don. 2023. Tomoip wordlist: Based on elicitation sessions with Simon Mangil from Milim village, recorded in Kokopo, East New Britain, October to November 2022. https://doi.org/10.5281/zenodo.8435080},
  keywords  = {cldf:Wordlist,linguistics}
}
% CLDF dataset published on Zenodo, derived from the Madang comparative wordlists.
% The quoted source title uses TeX opening/closing quotes (``...'') instead of
% straight double quotes, which typeset as two closing quotes and are an active
% shorthand character under some babel languages.
@misc{zgraggen_cldf_2021,
  author    = {Z'graggen, John Anton},
  title     = {{{CLDF}} Dataset Derived from {{Z}}'graggen's ``{{Madang Comparative Wordlists}}'' from 1980},
  year      = {2021},
  month     = jul,
  publisher = {Zenodo},
  doi       = {10.5281/zenodo.5121535},
  urldate   = {2024-07-05},
  abstract  = {Cite the source of the dataset as: Z'graggen, J A. (1980) A comparative word list of the Northern Adelbert Range Languages, Madang Province, Papua New Guinea. Canberra: Pacific Linguistics.},
  keywords  = {cldf:Wordlist,linguistics}
}