| A | B | C | D | E | F | G | H | I | J | K | L | M | N | O | P | Q | R | S | T | U | V | W | X | |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
1 | prompt | actual | predicted | tag | match | Human Analysis | Corrected actual | |||||||||||||||||
2 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'aid'; examples: ['18401', '17770', '17721', '16858', '15268', '15113', '14826', '14230', '12788', '9286', '8561']"}] | #meta+id | #beneficiary+ind | #meta | FALSE | #meta+id | ||||||||||||||||||
3 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'name'; examples: ['South Sudan - Floods', 'South Sudan - Population Movement from Sudan', 'South Sudan - Cholera Outbreak Upper Nile', 'South Sudan - Anticipatory Actions EVD Outbreak', 'South Sudan - Floods', 'South Sudan - Floods', 'South Sudan - Ebola Virus Disease Preparedness', 'South Sudan - Complex Emergency', 'South Sudan - Cholera', 'South Sudan - Cholera', 'Republic of South Sudan - Complex Emergency']"}] | #crisis+name | #crisis | FALSE | Prediction blank | #crisis+name | ||||||||||||||||||
4 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'dtype.id'; examples: ['12', '5', '1', '1', '12', '12', '1', '6', '1', '1', '7']"}] | #cause+id | #meta+id | #cause | FALSE | #cause+id | ||||||||||||||||||
5 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'dtype.name'; examples: ['Flood', 'Population Movement', 'Epidemic', 'Epidemic', 'Flood', 'Flood', 'Epidemic', 'Complex Emergency', 'Epidemic', 'Epidemic', 'Civil Unrest']"}] | #cause+name | #crisis+type | #cause | FALSE | #cause+name | ||||||||||||||||||
6 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'status'; examples: ['0', '0', '1', '1', '1', '1', '1', '1', '1', '1', '1']"}] | #status+code | #status | #status | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #status+code | |||||||||||||||||
7 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'status_display'; examples: ['Active', 'Active', 'Closed', 'Closed', 'Closed', 'Closed', 'Closed', 'Closed', 'Closed', 'Closed', 'Closed']"}] | #status+name | #status+name | #status | TRUE | #status+name | ||||||||||||||||||
8 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'start_date'; examples: ['2024-07-25T00:00:00Z', '2023-05-08T00:00:00Z', '2023-03-20T00:00:00Z', '2022-10-13T00:00:00Z', '2019-11-25T00:00:00Z', '2019-06-22T00:00:00Z', '2018-10-16T00:00:00Z', '2017-07-08T00:00:00Z', '2016-07-29T00:00:00Z', '2015-07-06T00:00:00Z', '2014-01-09T00:00:00Z']"}] | #date+start | #date+start | #date | TRUE | #date+start | ||||||||||||||||||
9 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'end_date'; examples: ['2024-09-30T00:00:00Z', '2023-08-31T00:00:00Z', '2023-07-31T00:00:00Z', '2023-01-31T00:00:00Z', '2021-07-31T00:00:00Z', '2019-11-22T00:00:00Z', '2019-02-28T00:00:00Z', '2018-12-31T00:00:00Z', '2016-12-27T00:00:00Z', '2015-10-20T00:00:00Z', '2015-07-31T00:00:00Z']"}] | #date+end | #date+end | #date | TRUE | #date+end | ||||||||||||||||||
10 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'country.iso3'; examples: ['SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD', 'SSD']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
11 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'country.name'; examples: ['South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan', 'South Sudan']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
12 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'region.id'; examples: ['0', '0', '0', '0', '0', '0', '0', '0', '0', '0', '0']"}] | #region+id | #adm1+code | #region | FALSE | Scenario 1 - predicted 'adm1' where label is 'region' region | #adm1+code | |||||||||||||||||
13 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for South Sudan8.csv'; dataset_description='The dataset contains information on various appeals and events related to South Sudan, including details such as the type of appeal, status, sector, amount requested and funded, start and end dates, as well as country-specific information like country code, region, and average household size. The data includes appeals for different crises such as floods, population movements, cholera outbreaks, and Ebola preparedness, with details on beneficiaries and confirmation needs. The dataset also includes metadata such as IDs, names, and translation modules for countries and regions.'; column_name:'region.region_name'; examples: ['Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa', 'Africa']"}] | #region+name | #region+name | #region | TRUE | #region+name | ||||||||||||||||||
14 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2016-2023 SDN Insecurity Insight Data3.xlsx'; dataset_description='The dataset contains information on various events related to insecurity in Sudan from 2016 to 2023, including data on Aid Worker KIKA Events, Attacks on Health Care Events, Conflict-related Sexual Violence Events, Education in Danger Events, Explosive Weapons Events, Food Security Protection in Danger Events. The data shows the number of events recorded each year for these categories, with some missing values for certain years. The dataset provides insights into the trends and occurrences of insecurity events in Sudan over the specified time period.'; column_name:'Country'; examples: ['Sudan', 'Sudan', 'Sudan', 'Sudan', 'Sudan', 'Sudan', 'Sudan', 'Sudan']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
15 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'ISO3'; examples: ['STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
16 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'Location'; examples: ['Região Centro', 'Região Sul', 'Região Norte', 'Região do Principe', 'Região Centro', 'Região Sul', 'Região Norte', 'Região do Principe', 'Região Centro', 'Região Sul', 'Região Norte']"}] | #loc+name | #adm1+name | #loc | FALSE | Scenario 9 - prediction correct (adm1), label incorrect (loc) | #loc+name | |||||||||||||||||
17 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'DataId'; examples: ['3517584', '2078280', '2086067', '2078289', '4220627', '5306972', '1182398', '4673618', '4220628', '5306973', '1182399']"}] | #meta+id | #meta+id | #meta | TRUE | #meta+id | ||||||||||||||||||
18 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'Indicator'; examples: ['Total fertility rate 15-49', 'Total fertility rate 15-49', 'Total fertility rate 15-49', 'Total fertility rate 15-49', 'Married women currently using any method of contraception', 'Married women currently using any method of contraception', 'Married women currently using any method of contraception', 'Married women currently using any method of contraception', 'Married women currently using any modern method of contraception', 'Married women currently using any modern method of contraception', 'Married women currently using any modern method of contraception']"}] | #indicator+name | #indicator+name | #indicator | TRUE | #indicator+name | ||||||||||||||||||
19 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'CountryName'; examples: ['Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
20 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'IndicatorId'; examples: ['FE_FRTR_W_TFR', 'FE_FRTR_W_TFR', 'FE_FRTR_W_TFR', 'FE_FRTR_W_TFR', 'FP_CUSM_W_ANY', 'FP_CUSM_W_ANY', 'FP_CUSM_W_ANY', 'FP_CUSM_W_ANY', 'FP_CUSM_W_MOD', 'FP_CUSM_W_MOD', 'FP_CUSM_W_MOD']"}] | #indicator+code | #indicator+id | #indicator | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #indicator+id | |||||||||||||||||
21 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe6.csv'; dataset_description='The dataset contains information on various indicators related to health and demographics in Sao Tome and Principe, with data points for different regions within the country. The indicators include total fertility rate for women aged 15-49, percentage of married women currently using contraception, and percentage of married women using modern contraception methods. The data includes values, precision, survey details, and characteristic categories for each indicator. The dataset covers the year 2008 and is sourced from the DHS (Demographic and Health Surveys) program.'; column_name:'ByVariableId'; examples: ['0', '0', '0', '0', '0', '0', '0', '0', '0', '0', '0']"}] | #indicator+code+label | #indicator+type | #indicator | FALSE | #indicator+code+label | ||||||||||||||||||
22 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'ISO3'; examples: ['STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP', 'STP']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
23 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'DataId'; examples: ['338517', '29286', '29287', '70060', '5442', '295240', '443078', '286160', '247074', '307207', '240622']"}] | #meta+id | #meta+id | #meta | TRUE | #meta+id | ||||||||||||||||||
24 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'Indicator'; examples: ['Total fertility rate 15-49', 'Married women currently using any method of contraception', 'Married women currently using any modern method of contraception', 'Unmet need for family planning', 'Demand for family planning satisfied by modern methods', 'Median age at first marriage [Women]: 25-49', 'Median age at first sexual intercourse [Women]: 25-49', 'Infant mortality rate', 'Infant mortality rate', 'Under-five mortality rate', 'Under-five mortality rate']"}] | #indicator+name | #indicator+name | #indicator | TRUE | #indicator+name | ||||||||||||||||||
25 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'CountryName'; examples: ['Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe', 'Sao Tome and Principe']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
26 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'IndicatorId'; examples: ['FE_FRTR_W_TFR', 'FP_CUSM_W_ANY', 'FP_CUSM_W_MOD', 'FP_NADM_W_UNT', 'FP_NADM_W_PDM', 'MA_AAFM_W_M2B', 'SX_AAFS_W_M2B', 'CM_ECMR_C_IMR', 'CM_ECMR_C_IMR', 'CM_ECMR_C_U5M', 'CM_ECMR_C_U5M']"}] | #indicator+code | #indicator+id | #indicator | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #indicator+id | |||||||||||||||||
27 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'ByVariableId'; examples: ['0', '0', '0', '0', '0', '0', '0', '14001', '14003', '14001', '14003']"}] | #indicator+code+label | #indicator+id | #indicator | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #indicator+id | |||||||||||||||||
28 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/DHS Quickstats Data for Sao Tome and Principe7.csv'; dataset_description='The dataset contains various indicators related to demographic and health statistics for Sao Tome and Principe in 2008, sourced from the DHS Quickstats Data file. The indicators include total fertility rate, contraceptive use among married women, unmet need for family planning, median age at first marriage and sexual intercourse, and infant mortality rates. Each data entry includes information such as the indicator name, value, precision, country code, survey details, and characteristic categories. The dataset provides insights into key health and demographic trends in Sao Tome and Principe during the specified survey year.'; column_name:'ByVariableLabel'; examples: ['', '', '', '', '', '', '', 'Five years preceding the survey', 'Ten years preceding the survey', 'Five years preceding the survey', 'Ten years preceding the survey']"}] | #indicator+label | #indicator+type | #indicator | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #indicator+type | |||||||||||||||||
29 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Year'; examples: [2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000, 2000]"}] | #date+occurred | #date | #date | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #date+occurred | |||||||||||||||||
30 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Country'; examples: ['Afghanistan', 'Algeria', 'Algeria', 'Algeria', 'Angola', 'Angola', 'Angola', 'Argentina', 'Argentina', 'Argentina', 'Argentina']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
31 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'ISO'; examples: ['AFG', 'DZA', 'DZA', 'DZA', 'AGO', 'AGO', 'AGO', 'ARG', 'ARG', 'ARG', 'ARG']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
32 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Disaster Type'; examples: ['Drought', 'Flood', 'Flood', 'Storm', 'Flood', 'Flood', 'Mass movement (wet)', 'Wildfire', 'Flood', 'Flood', 'Extreme temperature']"}] | #cause+type | #event+type | #cause | FALSE | #cause+type | ||||||||||||||||||
33 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Total Events'; examples: [1, 2, 2, 1, 3, 1, 1, 1, 3, 1, 1]"}] | #frequency | #event | #frequency | FALSE | #frequency | ||||||||||||||||||
34 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Total Affected'; examples: [2580000, 105, 100, 10, 9011, 70000, '', '', 31840, 6000, 300]"}] | #affected+ind | #affected | #affected | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #affected+ind | |||||||||||||||||
35 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/EMDAT-country-profiles_2024_07_292.xlsx'; dataset_description='The dataset contains information on disasters that occurred in various countries in the year 2000. It includes details such as the country, disaster type, total events, total affected individuals, total deaths, total damage in USD, and the Corruption Perceptions Index (CPI) for each country. The disasters recorded include droughts, floods, storms, wildfires, and landslides. The dataset provides a snapshot of the impact of natural disasters on different countries in the year 2000, highlighting the number of affected individuals, deaths, and economic damage caused by these events.'; column_name:'Total Deaths'; examples: [37, 37, 7, 4, 15, 31, 13, 8, 6, 7, 15]"}] | #affected+ind+killed | #affected+killed | #affected | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #affected+ind+killed | |||||||||||||||||
36 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/hdx-hxl-datasets3.csv'; dataset_description='The dataset contains information on various humanitarian response plans and hazard data for disaster risk assessment from different sources and organizations. It includes details such as dataset names, titles, organizations, sources, and creation/update dates. The data covers topics like displacement trends tracking, storm, wildfire, flood, earthquake, crop production, operational presence in Mozambique, attacks on protection in Bangladesh, and exposure data for disaster risk assessment. The dataset appears to be focused on providing valuable information for humanitarian efforts and disaster management.'; column_name:'HDX org'; examples: ['international-organization-for-migration', 'eth-zurich-weather-and-climate-risks', 'eth-zurich-weather-and-climate-risks', 'eth-zurich-weather-and-climate-risks', 'eth-zurich-weather-and-climate-risks', 'eth-zurich-weather-and-climate-risks', 'ocha-mozambique-hat', 'eth-zurich-weather-and-climate-risks', 'insecurity-insight', 'ipc', 'ipc']"}] | #org+code | #org+id | #org | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #org+id | |||||||||||||||||
37 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/hdx-hxl-datasets3.csv'; dataset_description='The dataset contains information on various humanitarian response plans and hazard data for disaster risk assessment from different sources and organizations. It includes details such as dataset names, titles, organizations, sources, and creation/update dates. The data covers topics like displacement trends tracking, storm, wildfire, flood, earthquake, crop production, operational presence in Mozambique, attacks on protection in Bangladesh, and exposure data for disaster risk assessment. The dataset appears to be focused on providing valuable information for humanitarian efforts and disaster management.'; column_name:'Source'; examples: ['International Organization for Migration (IOM)', 'ETH Zurich Climada', 'ETH Zurich Climada', 'ETH Zurich Climada', 'ETH Zurich Climada', 'ETH Zurich Climada', 'Humanitarian partners', 'ETH Zurich Climada', 'Insecurity Insight', 'National IPC Technical Working Group', 'National IPC Technical Working Group']"}] | #meta+source | #org+name | #meta | FALSE | #meta+source | ||||||||||||||||||
38 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/hdx-hxl-datasets3.csv'; dataset_description='The dataset contains information on various humanitarian response plans and hazard data for disaster risk assessment from different sources and organizations. It includes details such as dataset names, titles, organizations, sources, and creation/update dates. The data covers topics like displacement trends tracking, storm, wildfire, flood, earthquake, crop production, operational presence in Mozambique, attacks on protection in Bangladesh, and exposure data for disaster risk assessment. The dataset appears to be focused on providing valuable information for humanitarian efforts and disaster management.'; column_name:'Date created'; examples: ['2024-03-06', '2024-03-06', '2024-03-06', '2024-02-28', '2024-02-23', '2024-02-08', '2024-01-26', '2024-01-10', '2024-01-09', '2023-12-23', '2023-12-22']"}] | #date+start | #date | #date | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #date+start | |||||||||||||||||
39 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/OxCGRT_CSV3.csv'; dataset_description='The dataset contains information on various measures and indicators related to COVID-19 response for different countries and regions. It includes data such as government responses, containment measures, economic support, vaccination policies, confirmed cases, confirmed deaths, majority vaccinated status, population vaccinated, stringency index, and other related indices. The data is structured with columns representing different aspects of the response measures and indicators, with rows corresponding to specific dates and locations.'; column_name:'CountryName'; examples: ['Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba', 'Aruba']"}] | #country | #country+name | #country | FALSE | Scenario 3 - prediction adds extra correct attribute (eg 'name', 'code') | #country+name | |||||||||||||||||
40 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/OxCGRT_CSV3.csv'; dataset_description='The dataset contains information on various measures and indicators related to COVID-19 response for different countries and regions. It includes data such as government responses, containment measures, economic support, vaccination policies, confirmed cases, confirmed deaths, majority vaccinated status, population vaccinated, stringency index, and other related indices. The data is structured with columns representing different aspects of the response measures and indicators, with rows corresponding to specific dates and locations.'; column_name:'CountryCode'; examples: ['ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW', 'ABW']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
41 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/OxCGRT_CSV3.csv'; dataset_description='The dataset contains information on various measures and indicators related to COVID-19 response for different countries and regions. It includes data such as government responses, containment measures, economic support, vaccination policies, confirmed cases, confirmed deaths, majority vaccinated status, population vaccinated, stringency index, and other related indices. The data is structured with columns representing different aspects of the response measures and indicators, with rows corresponding to specific dates and locations.'; column_name:'Date'; examples: ['20200101', '20200102', '20200103', '20200104', '20200105', '20200106', '20200107', '20200108', '20200109', '20200110', '20200111']"}] | #date | #date | #date | TRUE | #date | ||||||||||||||||||
42 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 IRN SHCC Health Care Data3.xlsx'; dataset_description='The dataset contains information on health care-related incidents in Iran, including details such as the date, country, reported perpetrator, weapons used, number of attacks on health facilities, destruction and damage to health facilities, occupation of health facilities, health transportation status, looting/theft incidents, obstruction to health care, and harm to health workers (killed, injured, kidnapped, arrested, threatened, assaulted, sexually assaulted). The data also includes information on different categories of health workers affected, such as international health workers, national employees of aid agencies, and local health workers. Additionally, the dataset includes details on conflict-related violence, politically-related violence, COVID-19-related violence, Ebola-related violence, vaccination-related violence, and unique event IDs associated with each entry.'; column_name:'Date'; examples: ['2022-09-16', '2022-09-19', '2022-09-20', '2022-09-21', '2022-09-21', '2022-09-22', '2022-09-22', '2022-09-24', '2022-09-26', '2022-09-30', '2022-10-01']"}] | #date | #date | #date | TRUE | #date | ||||||||||||||||||
43 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 IRN SHCC Health Care Data3.xlsx'; dataset_description='The dataset contains information on health care-related incidents in Iran, including details such as the date, country, reported perpetrator, weapons used, number of attacks on health facilities, destruction and damage to health facilities, occupation of health facilities, health transportation status, looting/theft incidents, obstruction to health care, and harm to health workers (killed, injured, kidnapped, arrested, threatened, assaulted, sexually assaulted). The data also includes information on different categories of health workers affected, such as international health workers, national employees of aid agencies, and local health workers. Additionally, the dataset includes details on conflict-related violence, politically-related violence, COVID-19-related violence, Ebola-related violence, vaccination-related violence, and unique event IDs associated with each entry.'; column_name:'Country'; examples: ['Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran', 'Iran']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
44 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 IRN SHCC Health Care Data3.xlsx'; dataset_description='The dataset contains information on health care-related incidents in Iran, including details such as the date, country, reported perpetrator, weapons used, number of attacks on health facilities, destruction and damage to health facilities, occupation of health facilities, health transportation status, looting/theft incidents, obstruction to health care, and harm to health workers (killed, injured, kidnapped, arrested, threatened, assaulted, sexually assaulted). The data also includes information on different categories of health workers affected, such as international health workers, national employees of aid agencies, and local health workers. Additionally, the dataset includes details on conflict-related violence, politically-related violence, COVID-19-related violence, Ebola-related violence, vaccination-related violence, and unique event IDs associated with each entry.'; column_name:'SiND Event ID'; examples: [38057, 35283, 38199, 38052, 35619, 35621, 38125, 37892, 35630, 38200, 37877]"}] | #event+id | #event+id | #event | TRUE | #event+id | ||||||||||||||||||
45 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Black Sea Initiative Vessel Movements3.xlsx'; dataset_description='The dataset contains information on voyages undertaken by ships under the Black Sea Grain Initiative from August 1, 2022, to July 17, 2023. The data is sourced from the United Nations Joint Coordination Centre website and is presented in two tabs: DATA and DATA_HXL. The columns in the dataset include information such as status, outbound sequence, and departure port. The dataset provides details on shipments, voyage sequences, and departure ports related to the Black Sea Grain Initiative vessel movements.'; column_name:'Country'; examples: ['The Netherlands', 'The Netherlands', 'Iraq', 'Tunisia', 'China', 'France', 'Türkiye', 'Ethiopia', 'India', 'China', 'China']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
46 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 SHCC Incident Data3.xlsx'; dataset_description='The dataset contains information on incidents related to health facilities and workers in various countries, including details on the date, country, reported perpetrator, weapons used, number of attacks on health facilities, and impact on health workers. The data includes categories such as destruction, damage, occupation, abduction, assault, and threats to health workers, as well as details on the type of violence involved (conflict-related, politically-related, COVID-19-related, etc.). Each entry provides specific information on the incident, such as the type of weapon used, the number of health workers affected, and the outcome of any kidnappings or arrests.'; column_name:'Date'; examples: ['2022-01-01', '2022-01-01', '2022-01-01', '2022-01-01', '2022-01-01', '2022-01-02', '2022-01-02', '2022-01-04', '2022-01-04', '2022-01-05', '2022-01-05']"}] | #date | #date | #date | TRUE | #date+occurred | ||||||||||||||||||
47 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 SHCC Incident Data3.xlsx'; dataset_description='The dataset contains information on incidents related to health facilities and workers in various countries, including details on the date, country, reported perpetrator, weapons used, number of attacks on health facilities, and impact on health workers. The data includes categories such as destruction, damage, occupation, abduction, assault, and threats to health workers, as well as details on the type of violence involved (conflict-related, politically-related, COVID-19-related, etc.). Each entry provides specific information on the incident, such as the type of weapon used, the number of health workers affected, and the outcome of any kidnappings or arrests.'; column_name:'Country'; examples: ['Myanmar', 'Myanmar', 'Myanmar', 'Myanmar', 'Sudan', 'Myanmar', 'Sudan', 'Myanmar', 'Myanmar', 'Nigeria', 'Nigeria']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
48 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2022 SHCC Incident Data3.xlsx'; dataset_description='The dataset contains information on incidents related to health facilities and workers in various countries, including details on the date, country, reported perpetrator, weapons used, number of attacks on health facilities, and impact on health workers. The data includes categories such as destruction, damage, occupation, abduction, assault, and threats to health workers, as well as details on the type of violence involved (conflict-related, politically-related, COVID-19-related, etc.). Each entry provides specific information on the incident, such as the type of weapon used, the number of health workers affected, and the outcome of any kidnappings or arrests.'; column_name:'SiND Event ID'; examples: [30419, 30908, 30860, 30288, 30540, 30290, 30542, 30289, 30291, 34034, 30744]"}] | #event+id | #event+id | #event | TRUE | #event+id | ||||||||||||||||||
49 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Source'; examples: ['Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data']"}] | #meta+source | #meta+source | #meta | TRUE | #meta+source | ||||||||||||||||||
50 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Organisation Name'; examples: ['A.B.D.D.M', 'A.B.D.D.M', 'A.B.D.D.M', 'A.B.D.D.M', 'ACT Alliance', 'ACT Alliance', 'ACT Alliance', 'ACT Alliance', 'Action Aid', 'Action Aid', 'Action Aid']"}] | #org+impl | #org+name | #org | FALSE | Scenario 6 - labelled correct 'impl', prediction uses also correct 'name' | #org+name | |||||||||||||||||
51 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Organisation Type'; examples: ['Private Sector', 'Private Sector', 'Private Sector', 'Private Sector', 'International NGO', 'International NGO', 'International NGO', 'International NGO', 'International NGO', 'International NGO', 'International NGO']"}] | #org+type | #org+type | #org | TRUE | #org+type | ||||||||||||||||||
52 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Country'; examples: ['Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi', 'Burundi']"}] | #adm1+name | #country+name | #adm1 | FALSE | Scenario 2 - labelled 'adm1', predicted 'country' (admin 0) | #country+name | |||||||||||||||||
53 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Region'; examples: ['Muyinga', 'Muyinga', 'Muyinga', 'Muyinga', 'Cankuzo', 'Rumonge', 'Ruyigi', 'Ruyigi', 'Makamba', 'Makamba', 'Rutana']"}] | #region+name | #adm1+name | #region | FALSE | Scenario 1 - predicted 'adm1' where label is 'region' | #adm1+name | |||||||||||||||||
54 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Location'; examples: ['Giteranyi', 'Giteranyi', 'Muyinga', 'Muyinga', 'Gisigara', 'Rumonge', 'Gisuru', 'Kiniyia', 'Kayogoro', 'Nyanza-Lac', 'Giharo']"}] | #adm2+name | #loc+name | #adm2 | FALSE | Scenario 8 - prediction incorrect (adm2) | #adm2+name | |||||||||||||||||
55 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Burundi- Muyinga, Cankuzo, Makamba, Ruyigi, Rutana, Rumonge: Operational Presence3.xlsx'; dataset_description='nan'; column_name:'Sector'; examples: ['Protection', 'Health and nutrition', 'Protection', 'Health and nutrition', 'Protection', 'Education', 'Protection', 'Protection', 'Health and nutrition', 'Health and nutrition', 'Education']"}] | #sector+name | #sector | #sector | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #sector+name | |||||||||||||||||
56 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2016-2023 Attacks on Vaccination Campaigns3.xlsx'; dataset_description='The dataset contains information on attacks on vaccination campaigns from 2016 to 2023, including details such as the date, country, reported perpetrator, weapons used, number of attacks on health facilities, health workers affected (killed, injured, kidnapped, arrested), and other related indicators. The data includes specific incidents in countries like Afghanistan, Pakistan, and Nigeria, with information on the perpetrators and the outcomes of the attacks. The dataset provides a comprehensive overview of the challenges and threats faced by health workers and vaccination campaigns during this period.'; column_name:'Date'; examples: ['2016-01-10', '2016-01-13', '2016-01-15', '2016-01-19', '2016-02-06', '2016-02-17', '2016-03-16', '2016-03-17', '2016-03-17', '2016-03-26', '2016-05-16']"}] | #date | #date | #date | TRUE | #date+occurred | ||||||||||||||||||
57 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2016-2023 Attacks on Vaccination Campaigns3.xlsx'; dataset_description='The dataset contains information on attacks on vaccination campaigns from 2016 to 2023, including details such as the date, country, reported perpetrator, weapons used, number of attacks on health facilities, health workers affected (killed, injured, kidnapped, arrested), and other related indicators. The data includes specific incidents in countries like Afghanistan, Pakistan, and Nigeria, with information on the perpetrators and the outcomes of the attacks. The dataset provides a comprehensive overview of the challenges and threats faced by health workers and vaccination campaigns during this period.'; column_name:'Country'; examples: ['Afghanistan', 'Pakistan', 'Afghanistan', 'Pakistan', 'Afghanistan', 'Pakistan', 'Pakistan', 'Pakistan', 'Nigeria', 'Pakistan', 'Pakistan']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
58 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'aid'; examples: ['6973', '6144', '87', '805', '624']"}] | #meta+id | #beneficiary+ind | #meta | FALSE | #meta+id | ||||||||||||||||||
59 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'name'; examples: ['Uzbekistan - Population Movement', 'Uzbekistan - Explosion', 'Uzbekistan: Drought', 'Uzbekistan', 'Uzbekistan']"}] | #crisis+name | #activity+name | #crisis | FALSE | #crisis+name | ||||||||||||||||||
60 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'dtype.id'; examples: ['5', '13', '20', '13', '13']"}] | #cause+id | #meta+id | #cause | FALSE | #cause+id | ||||||||||||||||||
61 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'dtype.name'; examples: ['Population Movement', 'Other', 'Drought', 'Other', 'Other']"}] | #cause+name | #sector | #cause | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #cause+name | |||||||||||||||||
62 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'status'; examples: ['1', '1', '1', '1', '1']"}] | #status+code | #status | #status | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #status+code | |||||||||||||||||
63 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'status_display'; examples: ['Closed', 'Closed', 'Closed', 'Closed', 'Closed']"}] | #status+name | #status+name | #status | TRUE | #status+name | ||||||||||||||||||
64 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'start_date'; examples: ['2010-06-15T00:00:00Z', '2008-07-28T00:00:00Z', '2001-08-21T00:00:00Z', '1999-01-01T00:00:00Z', '1997-01-01T00:00:00Z']"}] | #date+start | #date+start | #date | TRUE | #date+start | ||||||||||||||||||
65 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'end_date'; examples: ['2010-12-31T00:00:00Z', '2008-10-31T00:00:00Z', '2001-12-20T00:00:00Z', '1999-12-31T00:00:00Z', '1997-12-31T00:00:00Z']"}] | #date+end | #date+end | #date | TRUE | #date+end | ||||||||||||||||||
66 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'country.iso3'; examples: ['UZB', 'UZB', 'UZB', 'UZB', 'UZB']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
67 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'country.name'; examples: ['Uzbekistan', 'Uzbekistan', 'Uzbekistan', 'Uzbekistan', 'Uzbekistan']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
68 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'region.id'; examples: ['3', '3', '3', '3', '3']"}] | #region+id | #region+id | #region | TRUE | #region+id | ||||||||||||||||||
69 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IFRC Appeals Data for Uzbekistan3.csv'; dataset_description='The dataset contains information on IFRC appeals data for Uzbekistan, including details such as appeal ID, name, type, status, sector, funding amounts, start and end dates, and country information. The data includes appeals related to population movement, explosions, drought, and general assistance in Uzbekistan. The dataset also includes details on the organization involved, such as the Red Crescent Society of Uzbekistan, as well as information on the region, beneficiaries, and confirmation status.'; column_name:'region.region_name'; examples: ['Europe', 'Europe', 'Europe', 'Europe', 'Europe']"}] | #region+name | #region+name | #region | TRUE | #region+name | ||||||||||||||||||
70 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2014-2018 - Somalia Death Rates3.xlsx'; dataset_description='The dataset contains information on death rates in various regions of Somalia from 2014 to 2018. It includes data such as the state, region, district, crude death rate, and under 5 years death rate. Each entry specifies the state, region, district, and corresponding death rates for both crude deaths and deaths under 5 years of age. The dataset provides a snapshot of mortality rates in different areas of Somalia over the specified time period.'; column_name:'STATE'; examples: ['Hirshabelle', 'South West', 'Jubaland', 'Jubaland', 'Jubaland', 'Somaliland', 'Hirshabelle', 'Banadir', 'Puntland', 'South West', 'South West']"}] | #region+name | #adm1+name | #region | FALSE | Scenario 1 - predicted 'adm1' where label is 'region' region | #adm1+name | |||||||||||||||||
71 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2014-2018 - Somalia Death Rates3.xlsx'; dataset_description='The dataset contains information on death rates in various regions of Somalia from 2014 to 2018. It includes data such as the state, region, district, crude death rate, and under 5 years death rate. Each entry specifies the state, region, district, and corresponding death rates for both crude deaths and deaths under 5 years of age. The dataset provides a snapshot of mortality rates in different areas of Somalia over the specified time period.'; column_name:'REGION'; examples: ['Middle Shabelle', 'Lower Shabelle', 'Lower Juba', 'Gedo', 'Lower Juba', 'Awdal', 'Middle Shabelle', 'Banadir', 'Bari', 'Lower Shabelle', 'Bay']"}] | #adm1+name | #adm1+name | #adm1 | TRUE | #adm1+name | ||||||||||||||||||
72 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2014-2018 - Somalia Death Rates3.xlsx'; dataset_description='The dataset contains information on death rates in various regions of Somalia from 2014 to 2018. It includes data such as the state, region, district, crude death rate, and under 5 years death rate. Each entry specifies the state, region, district, and corresponding death rates for both crude deaths and deaths under 5 years of age. The dataset provides a snapshot of mortality rates in different areas of Somalia over the specified time period.'; column_name:'PCODE'; examples: ['SO21', 'SO23', 'SO28', 'SO26', 'SO28', 'SO11', 'SO21', 'SO22', 'SO16', 'SO23', 'SO24']"}] | #adm1+code | #adm1+code | #adm1 | TRUE | #adm1+code | ||||||||||||||||||
73 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2014-2018 - Somalia Death Rates3.xlsx'; dataset_description='The dataset contains information on death rates in various regions of Somalia from 2014 to 2018. It includes data such as the state, region, district, crude death rate, and under 5 years death rate. Each entry specifies the state, region, district, and corresponding death rates for both crude deaths and deaths under 5 years of age. The dataset provides a snapshot of mortality rates in different areas of Somalia over the specified time period.'; column_name:'DISTRICT'; examples: ['Adan Yabaal', 'Afgooye', 'Afmadow', 'Baardheere', 'Badhaadhe', 'Baki', 'Balcad', 'Banadir', 'Bandarbeyla', 'Baraawe', 'Baydhaba']"}] | #adm2+name | #adm2+name | #adm2 | TRUE | #adm2+name | ||||||||||||||||||
74 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/2014-2018 - Somalia Death Rates3.xlsx'; dataset_description='The dataset contains information on death rates in various regions of Somalia from 2014 to 2018. It includes data such as the state, region, district, crude death rate, and under 5 years death rate. Each entry specifies the state, region, district, and corresponding death rates for both crude deaths and deaths under 5 years of age. The dataset provides a snapshot of mortality rates in different areas of Somalia over the specified time period.'; column_name:'PCODE DISTRICT'; examples: ['SO2102', 'SO2302', 'SO2802', 'SO2602', 'SO2803', 'SO1102', 'SO2103', 'SO2201', 'SO1602', 'SO2303', 'SO2401']"}] | #adm2+code | #adm2+code | #adm2 | TRUE | #adm2+code | ||||||||||||||||||
75 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': 'What are the HXL tags and attributes for a column with these details? resource_name=\'/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/SDG 4 Global and Thematic data3.csv\'; dataset_description=\'The dataset titled "SDG 4 Global and Thematic data3.csv" contains information on various indicators, country IDs, years, values, magnitudes, and qualifiers. The data includes indicator codes, country codes, and numerical values for different indicators across multiple years. For example, there are entries for indicator "ADMI.ENDOFLOWERSEC.MAT" and "ADMI.ENDOFLOWERSEC.READ" for the country with the country code "ZWE" from 2014 to 2021. The dataset appears to track specific metrics or indicators over time for different countries.\'; column_name:\'indicator_id\'; examples: [\'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.MAT\', \'ADMI.ENDOFLOWERSEC.READ\', \'ADMI.ENDOFLOWERSEC.READ\', \'ADMI.ENDOFLOWERSEC.READ\']'}] | #indicator+code | #indicator+id | #indicator | FALSE | Scenario 4 - 'code' and 'id' ambiguity in HXL standard | #indicator+id | |||||||||||||||||
76 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': 'What are the HXL tags and attributes for a column with these details? resource_name=\'/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/SDG 4 Global and Thematic data3.csv\'; dataset_description=\'The dataset titled "SDG 4 Global and Thematic data3.csv" contains information on various indicators, country IDs, years, values, magnitudes, and qualifiers. The data includes indicator codes, country codes, and numerical values for different indicators across multiple years. For example, there are entries for indicator "ADMI.ENDOFLOWERSEC.MAT" and "ADMI.ENDOFLOWERSEC.READ" for the country with the country code "ZWE" from 2014 to 2021. The dataset appears to track specific metrics or indicators over time for different countries.\'; column_name:\'country_id\'; examples: [\'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\', \'ZWE\']'}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
77 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/COVID-19 pandemic Attacks on Health Care in 20203.xlsx'; dataset_description='The dataset contains information on attacks on health care during the COVID-19 pandemic in 2020. It includes details such as event number, date, country, COVID-19 event type, conflict event type, perpetrator category, weapons used, and various impacts on health workers such as killings, kidnappings, arrests, threats, injuries, assaults, and sexual violence. The data shows incidents in countries like Sudan, Syria, Yemen, Palestine, Democratic Republic of Congo, and Libya, involving different types of conflict events and perpetrators.'; column_name:'ISO3 codes'; examples: ['SUD', 'SYR', 'YEM', 'PSE', 'COD', 'COD', 'COD', 'COD', 'LBY', 'LBY', 'LBY']"}] | #country+code | #country+code | #country | TRUE | #country+code | ||||||||||||||||||
78 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/COVID-19 pandemic Attacks on Health Care in 20203.xlsx'; dataset_description='The dataset contains information on attacks on health care during the COVID-19 pandemic in 2020. It includes details such as event number, date, country, COVID-19 event type, conflict event type, perpetrator category, weapons used, and various impacts on health workers such as killings, kidnappings, arrests, threats, injuries, assaults, and sexual violence. The data shows incidents in countries like Sudan, Syria, Yemen, Palestine, Democratic Republic of Congo, and Libya, involving different types of conflict events and perpetrators.'; column_name:'Country'; examples: ['Sudan', 'Syria', 'Yemen', 'OPT', 'DRC', 'DRC', 'DRC', 'DRC', 'Libya', 'Libya', 'Libya']"}] | #country+name | #country+name | #country | TRUE | #country+name | ||||||||||||||||||
79 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Source'; examples: ['Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data', 'Fields Data']"}] | #meta+source | #meta+source | #meta | TRUE | #meta+source | ||||||||||||||||||
80 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': 'What are the HXL tags and attributes for a column with these details? resource_name=\'/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx\'; dataset_description=\'nan\'; column_name:\'Organisation Name\'; examples: [\'Disaster Risk Reduction Network Philippines (DRRNet)\', \'Disaster Risk Reduction Network Philippines (DRRNet)\', \'Akbayanihan Foundation\', \'Western Visayas Network of NGOs (WEVNet)\', \'Western Visayas Network of NGOs (WEVNet)\', \'RealLIFE Foundation, Inc.\', \'Uswag Development Foundation, Inc.\', \'Uswag Development Foundation, Inc.\', \'Uswag Development Foundation, Inc.\', \'GRF Hublag Foundation, Inc.\', "Consortium for People\'s Development - Disaster Response"]'}] | #org+impl | #org+name | #org | FALSE | Scenario 6 - labelled correct 'impl', prediction uses also correct 'name' | #org+name | |||||||||||||||||
81 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Organisation Type'; examples: ['National NGO', 'National NGO', 'Private organization', 'Private organization', 'Private organization', 'National NGO', 'Private organization', 'Private organization', 'Private organization', 'Private organization', 'Private organization']"}] | #org+type | #org+type | #org | TRUE | #org+type | ||||||||||||||||||
82 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Region'; examples: ['Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia', 'Southeast Asia']"}] | #region+name | #region+name | #region | TRUE | #region+name | ||||||||||||||||||
83 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Country'; examples: ['Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines', 'Philippines']"}] | #adm1+name | #country+name | #adm1 | FALSE | Scenario 2 - labelled 'adm1', predicted 'country' (admin 0) | #country+name | |||||||||||||||||
84 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Location'; examples: ['Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan', 'Aklan']"}] | #adm2+name | #adm1+name | #adm2 | FALSE | Scenario 7 - admin level differences, needs more analysis | #adm2+name | |||||||||||||||||
85 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/FieldsData_3W_PHL_Aklan3.xlsx'; dataset_description='nan'; column_name:'Sector'; examples: ['Education', 'Disaster Risk Reduction', 'Livelihoods', 'Education', 'Disaster Risk Reduction', 'Education', 'Livelihoods', 'Health', 'Nutrition', 'Livelihoods', 'Education']"}] | #sector+name | #sector | #sector | FALSE | Scenario 5 - labelled has extra correct attribute prediction doesn't (eg 'code') | #sector+name | |||||||||||||||||
86 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Original Google Sheet3.google sheet'; dataset_description='nan'; column_name:'Release status'; examples: ['Released', 'Released', 'Released', 'Released', 'Released', 'Released', 'Released', 'Released', 'Released', 'Released', 'Released']"}] | #status | #status | #status | TRUE | #status+code | ||||||||||||||||||
87 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'aid'; examples: ['XM-DAC-41114-OUTPUT-00048714', 'XM-DAC-41114-PROJECT-00042380', '47122-NPL', 'CH-FDJP-CHE110141200-00', 'XI-IATI-UNPF-17-RR-CEF-084', 'XI-IATI-UNPF-17-RR-WFP-049', 'XI-IATI-UNPF-17-RR-WFP-048', 'XI-IATI-UNPF-17-RR-UDP-009', 'XI-IATI-UNPF-17-RR-IOM-031', 'XI-IATI-UNPF-17-RR-FPA-043', 'XI-IATI-UNPF-17-RR-FPA-042']"}] | #activity+id | #activity+id | #activity | TRUE | #activity+code | ||||||||||||||||||
88 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'reporting'; examples: ['United Nations Development Programme', 'United Nations Development Programme', 'Gavi, The Vaccine Alliance', 'Drugs for Neglected Diseases initiative', 'UN Pooled Funds', 'UN Pooled Funds', 'UN Pooled Funds', 'UN Pooled Funds', 'UN Pooled Funds', 'UN Pooled Funds', 'UN Pooled Funds']"}] | #org+name+reporting | #org+reporting | #org | FALSE | #org+name+reporting | ||||||||||||||||||
89 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'reporting_ref'; examples: ['XM-DAC-41114', 'XM-DAC-41114', '47122', 'CH-FDJP-CHE110141200', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF']"}] | #org+id+reporting | #org | #org | FALSE | #org+id+reporting | ||||||||||||||||||
90 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'funder_ref'; examples: ['UNDP', 'UNDP', 'GAVI', 'CH-FDJP-CHE110141200', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF', 'XI-IATI-UNPF']"}] | #org+funder+id | #org+funder+code | #org | FALSE | #org+funder+id | ||||||||||||||||||
91 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'status_code'; examples: ['Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation', 'Implementation']"}] | #status | #status+code | #status | FALSE | Scenario 3 - prediction adds extra correct attribute (eg 'name', 'code') | #status+code | |||||||||||||||||
92 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'day_start'; examples: ['2000-01-01', '2000-01-01', '2002-01-01', '2003-01-01', '2005-12-15', '2005-12-15', '2005-12-15', '2005-12-15', '2005-12-15', '2005-12-15', '2005-12-15']"}] | #date+start | #date+start | #date | TRUE | #date+start | ||||||||||||||||||
93 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'day_end'; examples: ['2025-12-31', '2025-12-31', '2027-12-31', '2028-12-31', '2030-12-31', '2030-12-31', '2030-12-31', '2030-12-31', '2030-12-31', '2030-12-31', '2030-12-31']"}] | #date+end | #date+end | #date | TRUE | #date+end | ||||||||||||||||||
94 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': 'What are the HXL tags and attributes for a column with these details? resource_name=\'/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv\'; dataset_description=\'The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.\'; column_name:\'description\'; examples: [\'Programme Effectiveness - UN C\', \'Management plan. Ensure that all anticipated programmatic and operational costs, including development effectiveness and implementation support arrangements are identified, fully costed in the budget.\', "Parent Activity of Gavi\'s Support to Nepal At this level, Joint Appraisal, Country Multi Year Plan, Annual Progress Report are provided as supporting documents. In 2020/2021, as a result of the COVID-19 pandemic, Multi-stakeholder dialogue (MSD) documents temporarily replaced the traditional Joint Appraisal to ensure that Gavi’s continuing support to the EPI programme be aligned with realities at country level. 
For details on each vaccine please refer to child activities.", \'Established in 2003 in Geneva, Switzerland, DNDi’s headquarters is active in Research & Development activities, as well as in administrative and support functions, including Finance, Human Resources, IT, Policy, Advocacy, Communications and External Relations.\', \'Intensification of immunization activity for the flood-affected people in Nepal\', \'Providing lifesaving support to women and children (girls and boys) directly affected by floods in Nepal\', \'Emergency cash distribution to the most vulnerable food insecure populations in four Tarai districts severely affected by flooding\', \'Safe disposal of disaster waste and essential community infrastructure rehabilitation\', \'Emergency shelter/non-food item support for populations affected by 2017 Flood in Terai Districts of Nepal\', \'Ensuring Lifesaving Sexual and Reproductive Health (SRH) services through mobile RH clinics\', \'Mitigating the impact of flood and displacement on women and girls through protection from violence and exploitation.\']'}] | #description | #activity | #description | FALSE | #description | ||||||||||||||||||
95 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'country_code'; examples: ['Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal', 'Nepal']"}] | #country+name | #country+name | #country | TRUE | #country+code | ||||||||||||||||||
96 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'sector_group'; examples: ['Unallocated / Unspecified', 'Unallocated / Unspecified', 'Basic Health', 'Health, General', '', '', '', '', '', '', '']"}] | #sector | #sector+name | #sector | FALSE | Scenario 3 - prediction adds extra correct attribute (eg 'name', 'code') | #sector+name | |||||||||||||||||
97 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'sector_code'; examples: ['Sectors not specified', 'Sectors not specified', 'Infectious disease control', '', '', '', '', '', '', '', '']"}] | #subsector | #sector+code | #subsector | FALSE | #subsector | ||||||||||||||||||
98 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/IATI activities in Nepal3.csv'; dataset_description='The dataset contains information on various aid activities in Nepal, including details such as activity ID, reporting organizations, start and end dates, descriptions, funding amounts in different currencies, country allocation percentages, sector information, and location details. The activities are implemented by organizations like the United Nations Development Programme, Gavi, The Vaccine Alliance, Drugs for Neglected Diseases initiative, and UN Pooled Funds. The dataset also includes links to additional information for each activity.'; column_name:'activity_id'; examples: ['http://d-portal.org/q.html?aid=XM-DAC-41114-OUTPUT-00048714', 'http://d-portal.org/q.html?aid=XM-DAC-41114-PROJECT-00042380', 'http://d-portal.org/q.html?aid=47122-NPL', 'http://d-portal.org/q.html?aid=CH-FDJP-CHE110141200-00', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-CEF-084', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-WFP-049', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-WFP-048', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-UDP-009', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-IOM-031', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-FPA-043', 'http://d-portal.org/q.html?aid=XI-IATI-UNPF-17-RR-FPA-042']"}] | #activity+url | #activity+id | #activity | FALSE | #activity+url | ||||||||||||||||||
99 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Child_protection_area_of_responsibility_organizations_hxl3.xlsx'; dataset_description='The dataset contains information related to child protection projects in the occupied Palestinian territory under the Humanitarian Response Plan 2022. It includes details such as project names, requested funding, target numbers, cluster names, governing entities, and organization names and types. Various international NGOs are involved in providing services such as child protection, mental health, and psychosocial support to vulnerable children and families affected by conflict-related violence and gender-based violence in different regions of the West Bank and Gaza Strip.'; column_name:'plan_id'; examples: [1059, 1059, 1059, 1059, 1059, 1059, 1059, 1059, 1059, 1059, 1059]"}] | #activity+id | #activity | FALSE | Prediction blank | #activity+id | ||||||||||||||||||
100 | [{'role': 'system', 'content': '\n You are an assistant that replies with HXL tags and attributes"\n '}, {'role': 'user', 'content': "What are the HXL tags and attributes for a column with these details? resource_name='/content/drive/MyDrive/Colab/hxl-metadata-prediction/data/Child_protection_area_of_responsibility_organizations_hxl3.xlsx'; dataset_description='The dataset contains information related to child protection projects in the occupied Palestinian territory under the Humanitarian Response Plan 2022. It includes details such as project names, requested funding, target numbers, cluster names, governing entities, and organization names and types. Various international NGOs are involved in providing services such as child protection, mental health, and psychosocial support to vulnerable children and families affected by conflict-related violence and gender-based violence in different regions of the West Bank and Gaza Strip.'; column_name:'Plan name'; examples: ['occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022', 'occupied Palestinian territory Humanitarian Response Plan 2022']"}] | #activity+name | #activity | FALSE | Prediction blank | #activity+name |