{"response":{"docs":[{"system_create_dtsi":"2022-11-12T19:46:46Z","system_modified_dtsi":"2022-11-12T19:47:19Z","has_model_ssim":["Dataset"],"id":"707958958","accessControl_ssim":["251ae43c-f283-4634-84d5-69b117121960"],"hasRelatedMediaFragment_ssim":["8049g6466"],"hasRelatedImage_ssim":["8049g6466"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nvl_pollution.csv"],"date_uploaded_dtsi":"2022-11-12T19:46:46Z","date_modified_dtsi":"2022-11-12T19:46:46Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/6ns7-e762"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Literature","Natural Language Processing","Topic Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["8049g6466"],"file_set_ids_ssim":["8049g6466"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NVL_POLLUTIONCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["707958958"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1749763232689553408,"timestamp":"2022-11-17T16:57:34.808Z","score":0.00049999997},{"system_create_dtsi":"2022-11-12T19:43:40Z","system_modified_dtsi":"2022-11-12T19:44:13Z","has_model_ssim":["Dataset"],"id":"n583xw57d","accessControl_ssim":["223b8d23-1644-4c49-bae6-0952a0aa9b21"],"hasRelatedMediaFragment_ssim":["rr171z90g"],"hasRelatedImage_ssim":["rr171z90g"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nvl_earth.csv"],"date_uploaded_dtsi":"2022-11-12T19:43:40Z","date_modified_dtsi":"2022-11-12T19:43:40Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/cs9y-0a69"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Topic Coherence","Natural Language Processing","Literature"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["rr171z90g"],"file_set_ids_ssim":["rr171z90g"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NVL_EARTHCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["n583xw57d"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1749763234449063936,"timestamp":"2022-11-17T16:57:36.485Z","score":0.00049999997},{"system_create_dtsi":"2022-11-12T19:38:15Z","system_modified_dtsi":"2022-11-12T19:38:48Z","has_model_ssim":["Dataset"],"id":"t148fj58c","accessControl_ssim":["6edf7700-e5d3-412c-9f37-bd6b4e04b666"],"hasRelatedMediaFragment_ssim":["tx31qk08g"],"hasRelatedImage_ssim":["tx31qk08g"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nvl_climate.csv"],"date_uploaded_dtsi":"2022-11-12T19:38:15Z","date_modified_dtsi":"2022-11-12T19:38:15Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/zzbj-9614"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Literature","Topic Coherence","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["tx31qk08g"],"file_set_ids_ssim":["tx31qk08g"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NVL_CLIMATECSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["t148fj58c"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1749763237045338112,"timestamp":"2022-11-17T16:57:38.962Z","score":0.00049999997},{"system_create_dtsi":"2022-11-12T19:34:49Z","system_modified_dtsi":"2022-11-12T19:35:24Z","has_model_ssim":["Dataset"],"id":"c247dt64g","accessControl_ssim":["453b03d9-1b9f-4f87-97f8-06a5405f798e"],"hasRelatedMediaFragment_ssim":["8c97ks093"],"hasRelatedImage_ssim":["8c97ks093"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nvl_environmental.csv"],"date_uploaded_dtsi":"2022-11-12T19:34:49Z","date_modified_dtsi":"2022-11-12T19:34:49Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/mb5f-s989"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Natural Language Processing","Literature"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["8c97ks093"],"file_set_ids_ssim":["8c97ks093"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NVL_ENVIRONMENTALCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["c247dt64g"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1749763238038339584,"timestamp":"2022-11-17T16:57:39.909Z","score":0.00049999997},{"system_create_dtsi":"2022-11-05T18:21:59Z","system_modified_dtsi":"2022-11-11T20:11:54Z","has_model_ssim":["Dataset"],"id":"rj430607v","accessControl_ssim":["8b94e2c2-5b9f-426d-a1af-b31d272e1ec6"],"hasRelatedMediaFragment_ssim":["dn39x2990"],"hasRelatedImage_ssim":["dn39x2990"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nvl_random5k.csv "],"date_uploaded_dtsi":"2022-11-05T18:21:58Z","date_modified_dtsi":"2022-11-11T20:11:54Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/nfyj-ah72"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Literature","Natural Language Processing","Coherence"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["dn39x2990","3f4627019"],"file_set_ids_ssim":["dn39x2990","3f4627019"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NVL_RANDOM5KCSV ","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__pathnames_ssim":["rj430607v"],"nesting_collection__deepest_nested_depth_isi":1,"_version_":1749763239566114816,"timestamp":"2022-11-17T16:57:41.366Z","score":0.00049999997},{"system_create_dtsi":"2022-11-04T21:01:40Z","system_modified_dtsi":"2022-11-04T21:02:13Z","has_model_ssim":["Dataset"],"id":"j098zc69m","accessControl_ssim":["ce8802a6-24a9-42e4-afcd-7c59b18cd762"],"hasRelatedMediaFragment_ssim":["pz50gx64p"],"hasRelatedImage_ssim":["pz50gx64p"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_environmental.csv"],"date_uploaded_dtsi":"2022-11-04T21:01:39Z","date_modified_dtsi":"2022-11-04T21:01:39Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/6594-eh39"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the topic coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one of) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc]\r\nSearchTerm[s] = (one of) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["pz50gx64p"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["pz50gx64p"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_ENVIRONMENTALCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/j098zc69m"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763426623684608,"timestamp":"2022-11-17T17:00:39.758Z","score":0.00049999997},{"system_create_dtsi":"2022-11-04T20:59:15Z","system_modified_dtsi":"2022-11-04T20:59:45Z","has_model_ssim":["Dataset"],"id":"ws859h247","accessControl_ssim":["d5425468-13fd-46fd-be6b-e9448cd7e9fb"],"hasRelatedMediaFragment_ssim":["m900nw083"],"hasRelatedImage_ssim":["m900nw083"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - pmc_earth.csv"],"date_uploaded_dtsi":"2022-11-04T20:59:14Z","date_modified_dtsi":"2022-11-04T20:59:14Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/qvpa-cg58"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["m900nw083"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["m900nw083"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS PMC_EARTHCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/ws859h247"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763424311574528,"timestamp":"2022-11-17T17:00:37.553Z","score":0.00049999997},{"system_create_dtsi":"2022-11-04T20:12:13Z","system_modified_dtsi":"2022-11-04T20:12:44Z","has_model_ssim":["Dataset"],"id":"8623j034w","accessControl_ssim":["a3e24de7-cc95-4011-a0d3-d361c1c5fd50"],"hasRelatedMediaFragment_ssim":["9z903144z"],"hasRelatedImage_ssim":["9z903144z"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nws_environmental.csv "],"date_uploaded_dtsi":"2022-11-04T20:12:12Z","date_modified_dtsi":"2022-11-04T20:12:12Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/d7c6-rj84"],"geo_subject_tesim":["United States"],"time_period_tesim":["21st century"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","Natural Language Processing","News"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row\r\n\r\n"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["9z903144z"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["9z903144z"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NWS_ENVIRONMENTALCSV ","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/8623j034w"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763428416749568,"timestamp":"2022-11-17T17:00:41.468Z","score":0.00049999997},{"system_create_dtsi":"2022-11-04T20:07:52Z","system_modified_dtsi":"2022-11-04T20:08:24Z","has_model_ssim":["Dataset"],"id":"sn00b033c","accessControl_ssim":["4f027e1b-5afd-4662-9707-67da7e749e97"],"hasRelatedMediaFragment_ssim":["4j03d1130"],"hasRelatedImage_ssim":["4j03d1130"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nws_random5k.csv "],"date_uploaded_dtsi":"2022-11-04T20:07:51Z","date_modified_dtsi":"2022-11-04T20:07:51Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/3s6j-j390"],"time_period_tesim":["21st century"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","News","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["4j03d1130"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["4j03d1130"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NWS_RANDOM5KCSV ","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/sn00b033c"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763422492295168,"timestamp":"2022-11-17T17:00:35.818Z","score":0.00049999997},{"system_create_dtsi":"2022-11-03T16:58:49Z","system_modified_dtsi":"2022-11-17T16:56:18Z","has_model_ssim":["Dataset"],"id":"jq085m40n","accessControl_ssim":["274117d2-6c08-4a05-b55e-c8d89e8d6fcf"],"hasRelatedMediaFragment_ssim":["x346d567v"],"hasRelatedImage_ssim":["x346d567v"],"depositor_ssim":["mccabeen@ucmail.uc.edu"],"depositor_tesim":["mccabeen@ucmail.uc.edu"],"title_tesim":["Coherence_Evaluations - nws_pollution.csv"],"date_uploaded_dtsi":"2022-11-03T16:58:48Z","date_modified_dtsi":"2022-11-17T16:56:14Z","isPartOf_ssim":["admin_set/default"],"doi_tesim":["doi:10.7945/yevs-9z66"],"geo_subject_tesim":["United States"],"time_period_tesim":["21st century"],"college_tesim":["Libraries"],"department_tesim":["Digital Scholarship Center (DSC)"],"creator_tesim":["McCabe, Erin E."],"publisher_tesim":["University of Cincinnati"],"subject_tesim":["Coherence","News","Natural Language Processing"],"language_tesim":["English"],"description_tesim":["CSV files containing the coherence scoring pertaining to datasets of:\r\nDocumentCount = 5,000\r\nCorpus = (one from) Federal Caselaw [cas] / Pubmed-Abstracts [pma] / Pubmed-Central [pmc] / News [nws]\r\nSearchTerm[s] = (one from) Earth / Environmental / Climate / Pollution / Random 5k documents of a specific corpus\r\n\r\nCoherence was scored across every combination of:\r\nTopicCount: 10-40\r\nHyperparameter-Alpha: [0.01, 0.31, 0.61, 0.91, symmetric, asymmetric]\r\nHyperparameter-Beta: [0.01, 0.31, 0.61, 0.91, automatic, symmetric]\r\n\r\nThe columns in this file include:\r\nValidation_Set: Which search term this scoring pertains to\r\nTopics: Number of topics in the model\r\nAlpha: Hyperparameter alpha selection from the 6 options above\r\nBeta: Hyperparameter beta selection from the 6 options above\r\nCoherence: The topic coherence score for the given model-row\r\nPerplexity: The perplexity score for the given model-row"],"license_tesim":["http://www.opendatacommons.org/licenses/by/1.0/"],"date_created_tesim":["2022"],"thumbnail_path_ss":"/assets/work-ff055336041c3f7d310ad69109eda4a887b16ec501f35afc0a547c4adb97ee72.png","suppressed_bsi":false,"actionable_workflow_roles_ssim":["admin_set/default-default-depositing"],"workflow_state_name_ssim":["deposited"],"member_ids_ssim":["x346d567v"],"member_of_collections_ssim":["Coherence Evaluations for 'Model of Models' Methods"],"member_of_collection_ids_ssim":["rr171z875"],"file_set_ids_ssim":["x346d567v"],"visibility_ssi":"open","admin_set_tesim":["Default Admin Set"],"sort_title_ssi":"COHERENCE_EVALUATIONS NWS_POLLUTIONCSV","human_readable_type_tesim":["Dataset"],"read_access_group_ssim":["public"],"edit_access_group_ssim":["admin"],"edit_access_person_ssim":["mccabeen@ucmail.uc.edu"],"nesting_collection__ancestors_ssim":["ng451k09w","ng451k09w/rr171z875"],"nesting_collection__parent_ids_ssim":["rr171z875"],"nesting_collection__pathnames_ssim":["ng451k09w/rr171z875/jq085m40n"],"nesting_collection__deepest_nested_depth_isi":3,"_version_":1749763421166895104,"timestamp":"2022-11-17T17:00:34.554Z","score":0.00049999997}],"facets":[{"name":"human_readable_type_sim","items":[{"value":"Dataset","hits":43,"label":"Dataset"},{"value":"Image","hits":3,"label":"Image"}],"label":"Human Readable Type Sim"},{"name":"creator_sim","items":[{"value":"McCabe, Erin E.","hits":46,"label":"McCabe, Erin E."}],"label":"Creator Sim"},{"name":"subject_sim","items":[{"value":"Natural Language Processing","hits":46,"label":"Natural Language Processing"},{"value":"Coherence","hits":23,"label":"Coherence"},{"value":"Topic Models","hits":19,"label":"Topic Models"},{"value":"Centrality","hits":16,"label":"Centrality"},{"value":"Caselaw","hits":15,"label":"Caselaw"},{"value":"Topic Coherence","hits":6,"label":"Topic Coherence"}],"label":"Subject Sim"},{"name":"college_sim","items":[{"value":"Libraries","hits":46,"label":"Libraries"}],"label":"College Sim"},{"name":"department_sim","items":[{"value":"Digital Scholarship Center (DSC)","hits":46,"label":"Digital Scholarship Center (DSC)"}],"label":"Department Sim"},{"name":"language_sim","items":[{"value":"English","hits":46,"label":"English"}],"label":"Language Sim"},{"name":"publisher_sim","items":[{"value":"University of Cincinnati","hits":46,"label":"University of Cincinnati"}],"label":"Publisher Sim"},{"name":"date_created_sim","items":[{"value":"2022","hits":46,"label":"2022"}],"label":"Date Created Sim"},{"name":"member_of_collection_ids_ssim","items":[{"value":"rr171z875","hits":20,"label":"rr171z875"},{"value":"12579t889","hits":16,"label":"12579t889"},{"value":"ng451k09w","hits":3,"label":"ng451k09w"}],"label":"Member Of Collection Ids Ssim"},{"name":"generic_type_sim","items":[{"value":"Work","hits":46,"label":"Work"}],"label":"Generic Type Sim"}],"pages":{"current_page":1,"next_page":2,"prev_page":null,"total_pages":5,"limit_value":10,"offset_value":0,"total_count":46,"first_page?":true,"last_page?":false}}}