Skip to content

Commit

Permalink
Standardize column descriptions to match those in the SQL files
Browse files (browse the repository at this point in the history)
  • Loading branch information
wendy-aw committed Feb 26, 2024
1 parent 799be7f commit 96c2eb6
Showing 1 changed file with 42 additions and 42 deletions.
84 changes: 42 additions & 42 deletions defog_data/supplementary.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -106,19 +106,19 @@ def load_embeddings(emb_path: str) -> tuple[dict, dict]:
columns_ner = {
"academic": {
"PERSON": [
"author.name,text,The name of the author",
"author.name,text,Name of the author",
],
"ORG": [
"conference.name,text,The name of the conference",
"journal.name,text,The name of the journal",
"organization.name,text,The name of the organization",
"organization.name,text,Name of the organization",
],
},
"advising": {
"PERSON": [
"instructor.name,text,The name of the instructor",
"student.firstname,text,The first name of the student",
"student.lastname,text,The last name of the student",
"instructor.name,text,Name of the instructor",
"student.firstname,text,First name of the student",
"student.lastname,text,Last name of the student",
],
"ORG": [
"program.college,text,Name of the college offering the program",
Expand All @@ -127,81 +127,81 @@ def load_embeddings(emb_path: str) -> tuple[dict, dict]:
},
"atis": {
"GPE": [
"airport_service.city_code,text,The city code where airport service is available",
"airport_service.city_code,text,The code of the city where the airport is located",
"airport.airport_location,text,The location of the airport, eg 'Las Vegas', 'Chicago'",
"airport.country_name,text,The country the airport is located in",
"airport.state_code,text,The state the airport is located in",
"city.city_code,text,The city code",
"city.city_name,text,The city name",
"city.country_name,text,The country name",
"city.state_code,text,The state code",
"ground_service.city_code,text,The city code where ground service is available",
"state.country_name,text,The country name",
"state.state_code,text,The state code",
"state.state_name,text,The state name",
"airport.country_name,text,The name of the country where the airport is located.",
"airport.state_code,text,The code assigned to the state where the airport is located.",
"city.city_code,text,The code assigned to the city",
"city.city_name,text,The name of the city",
"city.country_name,text,The name of the country where the city is located",
"city.state_code,text,The 2-letter code assigned to the state where the city is located. E.g. 'NY', 'CA', etc.",
"ground_service.city_code,text,The code for the city where the ground service is provided",
"state.country_name,text,The name of the country the state belongs to",
"state.state_code,text,The 2-letter code assigned to the state. E.g. 'NY', 'CA', etc.",
"state.state_name,text,The name of the state",
],
"ORG": [
"airline.airline_code,text,Code assigned to airline",
"airline.airline_name,text,The airline's name",
"airport_service.airport_code,text,The airport code where airport service is available",
"airport.airport_code,text,The 3-letter airport code",
"airline.airline_code,text,The code assigned to the airline",
"airline.airline_name,text,The name of the airline",
"airport_service.airport_code,text,The code of the airport",
"airport.airport_code,text,The code assigned to the airport.",
"airport.airport_name,text,The name of the airport",
"dual_carrier.main_airline,text,The name of the main airline operating the flight",
"fare.fare_airline,text,The airline's name",
"fare.fare_airline,text,The airline code associated with this fare",
"fare.from_airport,text,The 3-letter airport code for the departure location",
"fare.to_airport,text,The 3-letter airport code for the arrival location",
"flight.airline_code,text,Code assigned to airline",
"flight.from_airport,text,The 3-letter airport code for the departure location",
"flight.to_airport,text,The 3-letter airport code for the arrival location",
"ground_service.airport_code,text,The airport code where ground service is available",
"flight.airline_code,text,Code assigned to the airline",
"flight.from_airport,text,Code assigned to the departure airport",
"flight.to_airport,text,Code assigned to the arrival airport",
"ground_service.airport_code,text,The 3-letter code for the airport where the ground service is provided",
],
},
"yelp": {
"GPE": [
"business.city,text,The name of the city where the business is located",
"business.state,text,The US state where the business is located. This is represented by two-letter state abbreviations (eg. 'CA', 'NV', 'NY', etc.)",
"business.city,text,The city where the business is located",
"business.state,text,The US state where the business is located, represented by two-letter abbreviations (eg. 'CA', 'NV', 'NY', etc.)",
"business.full_address,text,The full address of the business",
],
"ORG": [
"business.name,text,The name of the business",
"business.name,text,The name of the business. All apostrophes use ’ instead of ' to avoid SQL errors.",
"neighbourhood.neighbourhood_name,text,Name of the neighbourhood where the business is located",
],
"PER": [
"users.name,text,The name of the user",
"users.name,text,Name of the user",
],
},
"restaurants": {
"GPE": [
"location.city_name,text,The city where the restaurant is located",
"location.street_name,text,The street where the restaurant is located",
"geographic.city_name,text,The city where the restaurant is located",
"geographic.county,text,The county where the restaurant is located",
"geographic.region,text,The region where the restaurant is located",
"location.city_name,text,The name of the city where the restaurant is located",
"location.street_name,text,The name of the street where the restaurant is located",
"geographic.city_name,text,The name of the city",
"geographic.county,text,The name of the county",
"geographic.region,text,The name of the region",
"restaurant.city_name,text,The city where the restaurant is located",
],
"ORG": [
"restaurant.name,text,The name of the restaurant",
"restaurant.id,bigint,The ID of the restaurant",
"restaurant.id,bigint,Unique identifier for each restaurant",
],
"PER": [],
},
"geography": {
"GPE": [
"city.city_name,text,The name of the city",
"city.country_name,text,The name of the country",
"city.state_name,text,The name of the state",
"city.country_name,text,The name of the country where the city is located",
"city.state_name,text,The name of the state where the city is located",
"lake.country_name,text,The name of the country where the lake is located",
"lake.state_name,text,The name of the state where the lake is located (if applicable)",
"river.country_name,text,The name of the country where the river flows through",
"river.traverse, text, The cities or landmarks the river passes through. Comma delimited, eg `new york,albany,boston`",
"river.country_name,text,The name of the country the river flows through",
"river.traverse, text, The cities or landmarks the river passes through. Comma delimited and in title case, eg `New York,Albany,Boston`",
"state.state_name,text,The name of the state",
"state.country_name,text,The name of the country the state belongs to",
"state.capital,text,The name of the capital city of the state",
"highlow.state_name,text,The name of the state",
"mountain.country_name,text,The name of the country where the mountain is located",
"mountain.state_name,text,The name of the state where the mountain is located (if applicable)",
"border_info.state_name,text,The name of the state that shares a border with another state or country",
"border_info.border,text,The name of the state or country that shares a border with the state specified in the state_name column",
"mountain.state_name,text,The name of the state or province where the mountain is located (if applicable)",
"border_info.state_name,text,The name of the state that shares a border with another state or country.",
"border_info.border,text,The name of the state that shares a border with the state specified in the state_name column.",
],
"LOC": [
"lake.lake_name,text,The name of the lake",
Expand Down

0 comments on commit 96c2eb6

Please sign in to comment.