-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathsdg.properties
82 lines (46 loc) · 6.98 KB
/
sdg.properties
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
[VIVO]
# Namespace to be used by all URIs generated for the sample data.
# NOTE(review): presumably identifiers are appended directly to this value, so keep the trailing slash -- confirm against the generator.
ns = http://vivo.mydomain.edu/individual/
[SDG]
# Settings for the Sample Data Generator (SDG).
# Name of the university to be created.
university_name = Sample University
# Comma-separated list of college names. The Sample Data Generator will select at random from the names you provide.
college_names = Science, Arts, Humanities, Design, Government, Fine Arts, Environment, Rehabilitation Sciences, Social Work, Natural Resources, Human Development, Law, Management, Public Affairs, Public Health, Social Sciences, Information Science, Architecture, Education, Medicine, Pharmacy, Nursing, Business, Journalism, Liberal Arts, Engineering, Dentistry, Veterinary Medicine, Biological Sciences, Recreation, Health Professions, Information Technology, Agriculture
# Comma-separated list of department names. The Sample Data Generator will select at random from the names you provide.
department_names = Science, Arts, Chemistry, Physics, Mathematics, Statistics, Astronomy, Classics, Chinese, French, Religious Studies, Aeronautics, Humanities, Design, Government, Fine Arts, Environment, Rehabilitation Sciences, Social Work, Natural Resources, Human Development, Law, Management, Public Affairs, Public Health, Social Sciences, Information Science, Architecture, Education, Medicine, Pharmacy, Nursing, Business, Journalism, Liberal Arts, Engineering, Dentistry, Veterinary Medicine, Biological Sciences, Recreation, Health Professions, Information Technology, Agriculture
# Given/first names of people. SDG will create names at random, selecting a random first name, a random middle initial, and a random last/family name.
first_names = Al, Bob, Charley, Daniel, Edgar, Frank, Gina, Harriet, Izzy, James, Kristi, Lauren, Michael, Nathan, Olivia, Pedro, Qzim, Robert, Sara, Tanisha, Udell, Violeta, Walter, Xinithia, Yiola, Zevon
# Family/last names of people. Add more for increased variety/diversity/localization/internationalization.
last_names = Amos, Barclay, Chisolm, Drew, Etherton, Franks, George, Hermann, Ithimore, Jones, Kendall, Laon, Marks, Nunes, Oscar, Paddington, Qura, Roberts, Stevens, Thomas, Ulam, Veronique, Williams, Xerxes, Yvette, Zebra
# Filler text used to provide overviews, titles of works, and abstracts. Random slices of this text are taken and combined.
lorem = Sed ornare, neque et scelerisque placerat, diam arcu tincidunt tortor, id maximus ex nulla ut nibh. Curabitur eget mi ac justo vehicula euismod. Morbi scelerisque rhoncus dui non finibus. Nam ut lobortis nunc. Maecenas magna quam, semper vitae velit ac, cursus tempor est. Class aptent taciti sociosqu ad litora torquent per conubia nostra, per inceptos himenaeos. Morbi enim quam, rutrum sollicitudin tincidunt vitae, sodales et nibh. Pellentesque habitant morbi tristique senectus et netus et malesuada fames ac turpis egestas. Aliquam pulvinar convallis est vel semper. Sed tristique ut felis eget bibendum. Cras varius dui commodo massa venenatis suscipit id in mauris. Interdum et malesuada fames ac ante ipsum primis in faucibus. Nulla at nibh in orci lacinia elementum et eget ante. Phasellus iaculis lectus in diam egestas molestie. Vestibulum non consequat est, a molestie ex
# Minimum number of colleges for your sample university. SDG will generate a university with somewhere between min and max colleges. If min = max, exactly that number will be used.
min_colleges_per_university = 1
# Maximum number of colleges for your sample university. Be careful: large numbers will generate large amounts of data.
max_colleges_per_university = 1
# Number of academic departments per college. Some colleges will have fewer, some more, but all will be in the range [min, max].
min_departments_per_college = 1
max_departments_per_college = 1
# Number of faculty per academic department, given as a min/max range.
# Example: if there are 3 colleges, each with 3 departments, and each department has 30 faculty members, your university will have 270 faculty.
min_faculty_per_department = 5
max_faculty_per_department = 20
# Number of works first-authored by each faculty member, given as a min/max range. The faculty member will also be a co-author on other works.
# Example: if 270 faculty average 50 works each, that is 13,500 works.
min_works_per_faculty = 0
max_works_per_faculty = 50
# Language tag to be used on triples generated by SDG. All the text in this file should be in the language specified by this tag.
lang = en
# Relative frequency of each kind of work in the collection you would like to generate. SDG generates 25 different kinds of works -- academic articles, books, software, etc.
# The numbers are given in the same order as the 25 types:
# AcademicArticle, BlogPosting, Book, BookSection, CaseStudy, Chapter, ConferencePaper, ConferencePoster, Database, EditedBook, EditorialArticle, ExtensionDocument, Film, Letter, Newsletter,
# NewsRelease, Patent, Report, Review, Software, Speech, Thesis, Video, Webpage, Website
# The first number is the relative frequency of academic articles; the second is for blog posts. With 300 for academic articles and 5 for blog posts, there should be
# 60 times as many academic articles in the generated data as there are blog posts. If all the numbers are the same, an equal distribution of works will be generated.
# If the relative frequency of a kind of work is 0, no works of that kind will be generated.
# Example: to generate data with many Films, change the 13th number in the list below from 5 to something larger such as 100. Films would then be generated 20 times as often as
# the kinds that have a 5, such as BlogPosting, and about 1/3 as often as AcademicArticles.
work_type_frequency = 300, 5, 10, 10, 5, 10, 20, 20, 10, 5, 10, 15, 5, 10, 5, 10, 15, 20, 15, 10, 10, 10, 10, 5, 5
# Comma-separated list of titles. People are given random titles from this list. Add more titles for more diversity.
titles = Instructor, Visiting Professor, Assistant Professor, Associate Professor, Professor, Professor Emeritus, Director, Chair, Dean
# Comma-separated list of concepts. Concepts are assigned to people as research areas and to works as subject areas. Add more for more diversity.
concepts = France 1500-1599, Physics, Urology, P53 tumor gene, Informatics, Economics, Behavioral Economics, Hypertension, Sports Journalism, Manifold algebra, Music theory, Derrida, Baseball, Marxism, Gender equity, Battle of Gettysburg, British Royal Navy, Bauhaus, Cubism, Coffee cultivation, 35mm photography, Obstetrics, Liver Transplant, Bavaria, Criminology, Probability Theory, Epistemology, Ontology, Set Theory, Political Parties
# Comma-separated list of journal names. Works are assigned to journals. Add more journals for more diversity.
# NOTE(review): "PloS Biology" below is capitalized differently from "PLoS One"; it looks like a typo for "PLoS Biology" -- confirm before changing the value.
journals = Cell, Nature, Science, Circulation, Journal of the American Statistical Association, Library Science, PloS Biology, PLoS One, JAMA, American Journal of Psychiatry, Acta Astronautica, Journal of Teacher Education, Angewandte Chemie, The Lancet, Data Intelligence, Journal of Biochemistry, Acta Paediatrica, Inorganic Chemistry, Annals of Internal Medicine, Accounts of Chemical Research, Journal of Ecology, Advanced Materials, Physical Review, Journal of Biology, Acta Mathematica, Proceedings of the Royal Society, New England Journal of Medicine, Annals of Mathematics, Annals of Chemistry