{"response":{"docs":[{"system_create_dtsi":"2022-08-10T16:15:40Z","system_modified_dtsi":"2022-08-19T15:17:43Z","has_model_ssim":["Dataset"],"id":"j098zc672","accessControl_ssim":["039ef95a-3cd3-4ec1-87df-b08403052a1b"],"hasRelatedMediaFragment_ssim":["nc580p23g"],"hasRelatedImage_ssim":["nc580p23g"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_random5k.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:36Z","date_modified_dtsi":"2022-08-10T16:15:37Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Natural Language Processing","Caselaw","Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["nc580p23g"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["nc580p23g"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_RANDOM5KCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/j098zc672"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763426292334592,"timestamp":"2022-11-17T17:00:39.442Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:37Z","system_modified_dtsi":"2022-08-19T15:17:45Z","has_model_ssim":["Dataset"],"id":"gh93h117t","accessControl_ssim":["deb329cb-4ba5-465c-9709-f27809390abb"],"hasRelatedMediaFragment_ssim":["xp68kh576"],"hasRelatedImage_ssim":["xp68kh576"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_pollution.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:36Z","date_modified_dtsi":"2022-08-10T16:15:36Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Natural Language Processing","Caselaw"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["xp68kh576"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["xp68kh576"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_POLLUTIONCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/gh93h117t"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763427080863744,"timestamp":"2022-11-17T17:00:40.194Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:37Z","system_modified_dtsi":"2022-08-10T16:22:58Z","has_model_ssim":["Dataset"],"id":"xp68kh56x","accessControl_ssim":["86a39277-a953-4e7d-8ce8-8727091439ec"],"hasRelatedMediaFragment_ssim":["c534fq50c"],"hasRelatedImage_ssim":["c534fq50c"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_environmental.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:36Z","date_modified_dtsi":"2022-08-10T16:15:36Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Caselaw","Coherence","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["c534fq50c"],"file_set_ids_ssim":["c534fq50c"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_ENVIRONMENTALCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["xp68kh56x"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1740791991239704576,"timestamp":"2022-08-10T16:23:32.251Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:37Z","system_modified_dtsi":"2022-08-10T16:22:59Z","has_model_ssim":["Dataset"],"id":"x920fz48z","accessControl_ssim":["e8b9a12a-0e9e-4c96-b2ad-6eb2d98a446c"],"hasRelatedMediaFragment_ssim":["k35695958"],"hasRelatedImage_ssim":["k35695958"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_earth.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:36Z","date_modified_dtsi":"2022-08-10T16:15:36Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Natural Language Processing","Caselaw"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["k35695958"],"file_set_ids_ssim":["k35695958"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_EARTHCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["x920fz48z"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1740791993658769408,"timestamp":"2022-08-10T16:23:34.558Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:36Z","system_modified_dtsi":"2022-08-19T15:18:05Z","has_model_ssim":["Dataset"],"id":"8049g644n","accessControl_ssim":["ee9aafb9-8b69-44e5-baca-f12dbbefdeb3"],"hasRelatedMediaFragment_ssim":["hq37vq040"],"hasRelatedImage_ssim":["hq37vq040"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_climate.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:35Z","date_modified_dtsi":"2022-08-10T16:15:35Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Caselaw","Coherence","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["hq37vq040"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["hq37vq040"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_CLIMATECSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/8049g644n"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763427866247168,"timestamp":"2022-11-17T17:00:40.943Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:36Z","system_modified_dtsi":"2022-08-19T15:18:06Z","has_model_ssim":["Dataset"],"id":"n870zs60z","accessControl_ssim":["9ac1c85e-3cc0-4182-80bd-8894b5a2bf18"],"hasRelatedMediaFragment_ssim":["v118rf94w"],"hasRelatedImage_ssim":["v118rf94w"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pma_random5k.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:35Z","date_modified_dtsi":"2022-08-10T16:15:35Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Natural Language Processing","Caselaw","Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["v118rf94w"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["v118rf94w"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMA_RANDOM5KCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/n870zs60z"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763432273412096,"timestamp":"2022-11-17T17:00:45.145Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:35Z","system_modified_dtsi":"2022-08-19T15:18:08Z","has_model_ssim":["Dataset"],"id":"sf2686591","accessControl_ssim":["eb96ed91-31a5-49e1-bb00-180c7596475c"],"hasRelatedMediaFragment_ssim":["9306t098v"],"hasRelatedImage_ssim":["9306t098v"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pma_pollution.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:34Z","date_modified_dtsi":"2022-08-10T16:15:34Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Natural Language Processing","Coherence","Caselaw"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["9306t098v"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["9306t098v"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMA_POLLUTIONCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/sf2686591"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763430469861376,"timestamp":"2022-11-17T17:00:43.426Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:24Z","system_modified_dtsi":"2022-08-19T15:18:10Z","has_model_ssim":["Dataset"],"id":"z603r0113","accessControl_ssim":["41499eba-4008-4888-aa2d-3c2f6c529850"],"hasRelatedMediaFragment_ssim":["pc289k57z"],"hasRelatedImage_ssim":["pc289k57z"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pma_environmental.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:23Z","date_modified_dtsi":"2022-08-10T16:15:23Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Caselaw","Natural Language Processing","Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["pc289k57z"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["pc289k57z"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMA_ENVIRONMENTALCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/z603r0113"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763428927406080,"timestamp":"2022-11-17T17:00:41.955Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:21Z","system_modified_dtsi":"2022-08-19T15:18:12Z","has_model_ssim":["Dataset"],"id":"ws859h23z","accessControl_ssim":["f139e1c3-f34b-4be1-8eab-752783e5d594"],"hasRelatedMediaFragment_ssim":["5t34sk935"],"hasRelatedImage_ssim":["5t34sk935"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pma_climate.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:19Z","date_modified_dtsi":"2022-08-10T16:15:20Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Natural Language Processing","Caselaw","Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["5t34sk935"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["5t34sk935"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMA_CLIMATECSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/ws859h23z"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763431006732288,"timestamp":"2022-11-17T17:00:43.938Z","score":0.00049999997},{"system_create_dtsi":"2022-08-10T16:15:21Z","system_modified_dtsi":"2022-08-19T15:18:14Z","has_model_ssim":["Dataset"],"id":"zg64tn46s","accessControl_ssim":["ac266158-d4c4-40bf-994c-24d268fbea06"],"hasRelatedMediaFragment_ssim":["ns064749n"],"hasRelatedImage_ssim":["ns064749n"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pma_earth.csv"],"date_uploaded_dtsi":"2022-08-10T16:15:20Z","date_modified_dtsi":"2022-08-10T16:15:20Z","isPartOf_ssim":["admin_set/default"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Caselaw","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/pddl/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["ns064749n"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["ns064749n"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMA_EARTHCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/zg64tn46s"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763433627123712,"timestamp":"2022-11-17T17:00:46.437Z","score":0.00049999997}],"facets":[{"name":"human_readable_type_sim","items":[{"value":"Dataset","hits":15,"label":"Dataset"}],"label":"Human Readable Type Sim"},{"name":"creator_sim","items":[{"value":"McCabe, Erin E.","hits":15,"label":"McCabe, Erin E."}],"label":"Creator Sim"},{"name":"subject_sim","items":[{"value":"Caselaw","hits":15,"label":"Caselaw"},{"value":"Coherence","hits":15,"label":"Coherence"},{"value":"Natural Language Processing","hits":15,"label":"Natural Language Processing"}],"label":"Subject Sim"},{"name":"college_sim","items":[{"value":"Libraries","hits":15,"label":"Libraries"}],"label":"College Sim"},{"name":"department_sim","items":[{"value":"Digital Scholarship Center (DSC)","hits":15,"label":"Digital Scholarship Center (DSC)"}],"label":"Department Sim"},{"name":"language_sim","items":[{"value":"English","hits":15,"label":"English"}],"label":"Language Sim"},{"name":"publisher_sim","items":[{"value":"University of Cincinnati","hits":15,"label":"University of Cincinnati"}],"label":"Publisher Sim"},{"name":"date_created_sim","items":[{"value":"2022","hits":15,"label":"2022"}],"label":"Date Created Sim"},{"name":"member_of_collection_ids_ssim","items":[{"value":"rr171z875","hits":13,"label":"rr171z875"}],"label":"Member Of Collection Ids Ssim"},{"name":"generic_type_sim","items":[{"value":"Work","hits":15,"label":"Work"}],"label":"Generic Type Sim"}],"pages":{"current_page":1,"next_page":2,"prev_page":null,"total_pages":2,"limit_value":10,"offset_value":0,"total_count":15,"first_page?":true,"last_page?":false}}}