Doc styler examples (#14953)

* Fix bad examples * Add black formatting to style_doc * Use first nonempty line * Put it at the right place * Don't add spaces to empty lines * Better templates * Deal with triple quotes in docstrings * Result of style_doc * Enable mdx treatment and fix code examples in MDXs * Result of doc styler on doc source files * Last fixes * Break copy from
2021-12-27 19:07:46 -05:00
parent e13f72fbff
commit b5e2b183af
211 changed files with 2738 additions and 1711 deletions
--- a/docs/source/model_doc/tapas.mdx
+++ b/docs/source/model_doc/tapas.mdx
@@ -75,28 +75,28 @@ dependency in case you're using Tensorflow:
 >>> from transformers import TapasConfig, TapasForQuestionAnswering

 >>> # for example, the base sized model with default SQA configuration
->>> model = TapasForQuestionAnswering.from_pretrained('google/tapas-base')
+>>> model = TapasForQuestionAnswering.from_pretrained("google/tapas-base")

 >>> # or, the base sized model with WTQ configuration
->>> config = TapasConfig.from_pretrained('google/tapas-base-finetuned-wtq')
->>> model = TapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> config = TapasConfig.from_pretrained("google/tapas-base-finetuned-wtq")
+>>> model = TapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)

 >>> # or, the base sized model with WikiSQL configuration
->>> config = TapasConfig('google-base-finetuned-wikisql-supervised')
->>> model = TapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> config = TapasConfig("google-base-finetuned-wikisql-supervised")
+>>> model = TapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)
 ===PT-TF-SPLIT===
 >>> from transformers import TapasConfig, TFTapasForQuestionAnswering

 >>> # for example, the base sized model with default SQA configuration
->>> model = TFTapasForQuestionAnswering.from_pretrained('google/tapas-base')
+>>> model = TFTapasForQuestionAnswering.from_pretrained("google/tapas-base")

 >>> # or, the base sized model with WTQ configuration
->>> config = TapasConfig.from_pretrained('google/tapas-base-finetuned-wtq')
->>> model = TFTapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> config = TapasConfig.from_pretrained("google/tapas-base-finetuned-wtq")
+>>> model = TFTapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)

 >>> # or, the base sized model with WikiSQL configuration
->>> config = TapasConfig('google-base-finetuned-wikisql-supervised')
->>> model = TFTapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> config = TapasConfig("google-base-finetuned-wikisql-supervised")
+>>> model = TFTapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)
 ```

 Of course, you don't necessarily have to follow one of these three ways in which TAPAS was fine-tuned. You can also experiment by defining any hyperparameters you want when initializing [`TapasConfig`], and then create a [`TapasForQuestionAnswering`] based on that configuration. For example, if you have a dataset that has both conversational questions and questions that might involve aggregation, then you can do it this way. Here's an example:
@@ -107,14 +107,14 @@ Of course, you don't necessarily have to follow one of these three ways in which
 >>> # you can initialize the classification heads any way you want (see docs of TapasConfig)
 >>> config = TapasConfig(num_aggregation_labels=3, average_logits_per_cell=True)
 >>> # initializing the pre-trained base sized model with our custom classification heads
->>> model = TapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> model = TapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)
 ===PT-TF-SPLIT===
 >>> from transformers import TapasConfig, TFTapasForQuestionAnswering

 >>> # you can initialize the classification heads any way you want (see docs of TapasConfig)
 >>> config = TapasConfig(num_aggregation_labels=3, average_logits_per_cell=True)
 >>> # initializing the pre-trained base sized model with our custom classification heads
->>> model = TFTapasForQuestionAnswering.from_pretrained('google/tapas-base', config=config)
+>>> model = TFTapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)
 ```

 What you can also do is start from an already fine-tuned checkpoint. A note here is that the already fine-tuned checkpoint on WTQ has some issues due to the L2-loss which is somewhat brittle. See [here](https://github.com/google-research/tapas/issues/91#issuecomment-735719340) for more info.
@@ -154,15 +154,26 @@ inputs to be fine-tuned:
 >>> from transformers import TapasTokenizer
 >>> import pandas as pd

->>> model_name = 'google/tapas-base'
+>>> model_name = "google/tapas-base"
 >>> tokenizer = TapasTokenizer.from_pretrained(model_name)

->>> data = {'Actors': ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], 'Number of movies': ["87", "53", "69"]}
->>> queries = ["What is the name of the first actor?", "How many movies has George Clooney played in?", "What is the total number of movies?"]
+>>> data = {"Actors": ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], "Number of movies": ["87", "53", "69"]}
+>>> queries = [
+...     "What is the name of the first actor?",
+...     "How many movies has George Clooney played in?",
+...     "What is the total number of movies?",
+... ]
 >>> answer_coordinates = [[(0, 0)], [(2, 1)], [(0, 1), (1, 1), (2, 1)]]
 >>> answer_text = [["Brad Pitt"], ["69"], ["209"]]
 >>> table = pd.DataFrame.from_dict(data)
->>> inputs = tokenizer(table=table, queries=queries, answer_coordinates=answer_coordinates, answer_text=answer_text, padding='max_length', return_tensors='pt')
+>>> inputs = tokenizer(
+...     table=table,
+...     queries=queries,
+...     answer_coordinates=answer_coordinates,
+...     answer_text=answer_text,
+...     padding="max_length",
+...     return_tensors="pt",
+... )
 >>> inputs
 {'input_ids': tensor([[ ... ]]), 'attention_mask': tensor([[...]]), 'token_type_ids': tensor([[[...]]]),
 'numeric_values': tensor([[ ... ]]), 'numeric_values_scale: tensor([[ ... ]]), labels: tensor([[ ... ]])}
@@ -170,15 +181,26 @@ inputs to be fine-tuned:
 >>> from transformers import TapasTokenizer
 >>> import pandas as pd

->>> model_name = 'google/tapas-base'
+>>> model_name = "google/tapas-base"
 >>> tokenizer = TapasTokenizer.from_pretrained(model_name)

->>> data = {'Actors': ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], 'Number of movies': ["87", "53", "69"]}
->>> queries = ["What is the name of the first actor?", "How many movies has George Clooney played in?", "What is the total number of movies?"]
+>>> data = {"Actors": ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], "Number of movies": ["87", "53", "69"]}
+>>> queries = [
+...     "What is the name of the first actor?",
+...     "How many movies has George Clooney played in?",
+...     "What is the total number of movies?",
+... ]
 >>> answer_coordinates = [[(0, 0)], [(2, 1)], [(0, 1), (1, 1), (2, 1)]]
 >>> answer_text = [["Brad Pitt"], ["69"], ["209"]]
 >>> table = pd.DataFrame.from_dict(data)
->>> inputs = tokenizer(table=table, queries=queries, answer_coordinates=answer_coordinates, answer_text=answer_text, padding='max_length', return_tensors='tf')
+>>> inputs = tokenizer(
+...     table=table,
+...     queries=queries,
+...     answer_coordinates=answer_coordinates,
+...     answer_text=answer_text,
+...     padding="max_length",
+...     return_tensors="tf",
+... )
 >>> inputs
 {'input_ids': tensor([[ ... ]]), 'attention_mask': tensor([[...]]), 'token_type_ids': tensor([[[...]]]),
 'numeric_values': tensor([[ ... ]]), 'numeric_values_scale: tensor([[ ... ]]), labels: tensor([[ ... ]])}
@@ -194,32 +216,37 @@ Of course, this only shows how to encode a single training example. It is advise
 >>> tsv_path = "your_path_to_the_tsv_file"
 >>> table_csv_path = "your_path_to_a_directory_containing_all_csv_files"

+
 >>> class TableDataset(torch.utils.data.Dataset):
 ...     def __init__(self, data, tokenizer):
 ...         self.data = data
 ...         self.tokenizer = tokenizer
-...
+
 ...     def __getitem__(self, idx):
 ...         item = data.iloc[idx]
-...         table = pd.read_csv(table_csv_path + item.table_file).astype(str) # be sure to make your table data text only
-...         encoding = self.tokenizer(table=table, 
-...                                   queries=item.question, 
-...                                   answer_coordinates=item.answer_coordinates, 
-...                                   answer_text=item.answer_text,
-...                                   truncation=True,
-...                                   padding="max_length",
-...                                   return_tensors="pt"
+...         table = pd.read_csv(table_csv_path + item.table_file).astype(
+...             str
+...         )  # be sure to make your table data text only
+...         encoding = self.tokenizer(
+...             table=table,
+...             queries=item.question,
+...             answer_coordinates=item.answer_coordinates,
+...             answer_text=item.answer_text,
+...             truncation=True,
+...             padding="max_length",
+...             return_tensors="pt",
 ...         )
 ...         # remove the batch dimension which the tokenizer adds by default
 ...         encoding = {key: val.squeeze(0) for key, val in encoding.items()}
 ...         # add the float_answer which is also required (weak supervision for aggregation case)
-...         encoding["float_answer"] = torch.tensor(item.float_answer) 
+...         encoding["float_answer"] = torch.tensor(item.float_answer)
 ...         return encoding
-...
-...     def __len__(self):
-...        return len(self.data)

->>> data = pd.read_csv(tsv_path, sep='\t')
+...     def __len__(self):
+...         return len(self.data)
+
+
+>>> data = pd.read_csv(tsv_path, sep="\t")
 >>> train_dataset = TableDataset(data, tokenizer)
 >>> train_dataloader = torch.utils.data.DataLoader(train_dataset, batch_size=32)
 ===PT-TF-SPLIT===
@@ -229,44 +256,50 @@ Of course, this only shows how to encode a single training example. It is advise
 >>> tsv_path = "your_path_to_the_tsv_file"
 >>> table_csv_path = "your_path_to_a_directory_containing_all_csv_files"

+
 >>> class TableDataset:
 ...     def __init__(self, data, tokenizer):
 ...         self.data = data
 ...         self.tokenizer = tokenizer
-...
+
 ...     def __iter__(self):
 ...         for idx in range(self.__len__()):
 ...             item = self.data.iloc[idx]
-...             table = pd.read_csv(table_csv_path + item.table_file).astype(str) # be sure to make your table data text only
-...             encoding = self.tokenizer(table=table, 
-...                                   queries=item.question, 
-...                                   answer_coordinates=item.answer_coordinates, 
-...                                   answer_text=item.answer_text,
-...                                   truncation=True,
-...                                   padding="max_length",
-...                                   return_tensors="tf"
+...             table = pd.read_csv(table_csv_path + item.table_file).astype(
+...                 str
+...             )  # be sure to make your table data text only
+...             encoding = self.tokenizer(
+...                 table=table,
+...                 queries=item.question,
+...                 answer_coordinates=item.answer_coordinates,
+...                 answer_text=item.answer_text,
+...                 truncation=True,
+...                 padding="max_length",
+...                 return_tensors="tf",
 ...             )
 ...             # remove the batch dimension which the tokenizer adds by default
-...             encoding = {key: tf.squeeze(val,0) for key, val in encoding.items()}
+...             encoding = {key: tf.squeeze(val, 0) for key, val in encoding.items()}
 ...             # add the float_answer which is also required (weak supervision for aggregation case)
-...             encoding["float_answer"] = tf.convert_to_tensor(item.float_answer,dtype=tf.float32)
-...             yield encoding['input_ids'], encoding['attention_mask'], encoding['numeric_values'], \
-...                   encoding['numeric_values_scale'], encoding['token_type_ids'], encoding['labels'], \
-...                   encoding['float_answer']
-...
-...     def __len__(self):
-...        return len(self.data)
+...             encoding["float_answer"] = tf.convert_to_tensor(item.float_answer, dtype=tf.float32)
+...             yield encoding["input_ids"], encoding["attention_mask"], encoding["numeric_values"], encoding[
+...                 "numeric_values_scale"
+...             ], encoding["token_type_ids"], encoding["labels"], encoding["float_answer"]

->>> data = pd.read_csv(tsv_path, sep='\t')
+...     def __len__(self):
+...         return len(self.data)
+
+
+>>> data = pd.read_csv(tsv_path, sep="\t")
 >>> train_dataset = TableDataset(data, tokenizer)
 >>> output_signature = (
-... tf.TensorSpec(shape=(512,), dtype=tf.int32),
-... tf.TensorSpec(shape=(512,), dtype=tf.int32),
-... tf.TensorSpec(shape=(512,), dtype=tf.float32),
-... tf.TensorSpec(shape=(512,), dtype=tf.float32),
-... tf.TensorSpec(shape=(512,7), dtype=tf.int32),
-... tf.TensorSpec(shape=(512,), dtype=tf.int32),
-... tf.TensorSpec(shape=(512,), dtype=tf.float32))
+...     tf.TensorSpec(shape=(512,), dtype=tf.int32),
+...     tf.TensorSpec(shape=(512,), dtype=tf.int32),
+...     tf.TensorSpec(shape=(512,), dtype=tf.float32),
+...     tf.TensorSpec(shape=(512,), dtype=tf.float32),
+...     tf.TensorSpec(shape=(512, 7), dtype=tf.int32),
+...     tf.TensorSpec(shape=(512,), dtype=tf.int32),
+...     tf.TensorSpec(shape=(512,), dtype=tf.float32),
+... )
 >>> train_dataloader = tf.data.Dataset.from_generator(train_dataset, output_signature=output_signature).batch(32)
 ```

@@ -282,15 +315,15 @@ You can then fine-tune [`TapasForQuestionAnswering`] or [`TFTapasForQuestionAnsw

 >>> # this is the default WTQ configuration
 >>> config = TapasConfig(
-...            num_aggregation_labels = 4,
-...            use_answer_as_supervision = True,
-...            answer_loss_cutoff = 0.664694,
-...            cell_selection_preference = 0.207951,
-...            huber_loss_delta = 0.121194,
-...            init_cell_selection_weights_to_zero = True,
-...            select_one_column = True,
-...            allow_empty_column_selection = False,
-...            temperature = 0.0352513,
+...     num_aggregation_labels=4,
+...     use_answer_as_supervision=True,
+...     answer_loss_cutoff=0.664694,
+...     cell_selection_preference=0.207951,
+...     huber_loss_delta=0.121194,
+...     init_cell_selection_weights_to_zero=True,
+...     select_one_column=True,
+...     allow_empty_column_selection=False,
+...     temperature=0.0352513,
 ... )
 >>> model = TapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)

@@ -298,8 +331,8 @@ You can then fine-tune [`TapasForQuestionAnswering`] or [`TFTapasForQuestionAnsw

 >>> model.train()
 >>> for epoch in range(2):  # loop over the dataset multiple times
-...    for batch in train_dataloader:
-...         # get the inputs; 
+...     for batch in train_dataloader:
+...         # get the inputs;
 ...         input_ids = batch["input_ids"]
 ...         attention_mask = batch["attention_mask"]
 ...         token_type_ids = batch["token_type_ids"]
@@ -312,9 +345,15 @@ You can then fine-tune [`TapasForQuestionAnswering`] or [`TFTapasForQuestionAnsw
 ...         optimizer.zero_grad()

 ...         # forward + backward + optimize
-...         outputs = model(input_ids=input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids, 
-...                        labels=labels, numeric_values=numeric_values, numeric_values_scale=numeric_values_scale, 
-...                        float_answer=float_answer)
+...         outputs = model(
+...             input_ids=input_ids,
+...             attention_mask=attention_mask,
+...             token_type_ids=token_type_ids,
+...             labels=labels,
+...             numeric_values=numeric_values,
+...             numeric_values_scale=numeric_values_scale,
+...             float_answer=float_answer,
+...         )
 ...         loss = outputs.loss
 ...         loss.backward()
 ...         optimizer.step()
@@ -324,23 +363,23 @@ You can then fine-tune [`TapasForQuestionAnswering`] or [`TFTapasForQuestionAnsw

 >>> # this is the default WTQ configuration
 >>> config = TapasConfig(
-...            num_aggregation_labels = 4,
-...            use_answer_as_supervision = True,
-...            answer_loss_cutoff = 0.664694,
-...            cell_selection_preference = 0.207951,
-...            huber_loss_delta = 0.121194,
-...            init_cell_selection_weights_to_zero = True,
-...            select_one_column = True,
-...            allow_empty_column_selection = False,
-...            temperature = 0.0352513,
+...     num_aggregation_labels=4,
+...     use_answer_as_supervision=True,
+...     answer_loss_cutoff=0.664694,
+...     cell_selection_preference=0.207951,
+...     huber_loss_delta=0.121194,
+...     init_cell_selection_weights_to_zero=True,
+...     select_one_column=True,
+...     allow_empty_column_selection=False,
+...     temperature=0.0352513,
 ... )
 >>> model = TFTapasForQuestionAnswering.from_pretrained("google/tapas-base", config=config)

 >>> optimizer = tf.keras.optimizers.Adam(learning_rate=5e-5)

 >>> for epoch in range(2):  # loop over the dataset multiple times
-...    for batch in train_dataloader:
-...         # get the inputs; 
+...     for batch in train_dataloader:
+...         # get the inputs;
 ...         input_ids = batch[0]
 ...         attention_mask = batch[1]
 ...         token_type_ids = batch[4]
@@ -351,9 +390,15 @@ You can then fine-tune [`TapasForQuestionAnswering`] or [`TFTapasForQuestionAnsw

 ...         # forward + backward + optimize
 ...         with tf.GradientTape() as tape:
-...              outputs = model(input_ids=input_ids, attention_mask=attention_mask, token_type_ids=token_type_ids, 
-...                        labels=labels, numeric_values=numeric_values, numeric_values_scale=numeric_values_scale, 
-...                        float_answer=float_answer )
+...             outputs = model(
+...                 input_ids=input_ids,
+...                 attention_mask=attention_mask,
+...                 token_type_ids=token_type_ids,
+...                 labels=labels,
+...                 numeric_values=numeric_values,
+...                 numeric_values_scale=numeric_values_scale,
+...                 float_answer=float_answer,
+...             )
 ...         grads = tape.gradient(outputs.loss, model.trainable_weights)
 ...         optimizer.apply_gradients(zip(grads, model.trainable_weights))
 ```
@@ -366,47 +411,49 @@ However, note that inference is **different** depending on whether or not the se

 ```py
 >>> from transformers import TapasTokenizer, TapasForQuestionAnswering
->>> import pandas as pd 
+>>> import pandas as pd

->>> model_name = 'google/tapas-base-finetuned-wtq'
+>>> model_name = "google/tapas-base-finetuned-wtq"
 >>> model = TapasForQuestionAnswering.from_pretrained(model_name)
 >>> tokenizer = TapasTokenizer.from_pretrained(model_name)

->>> data = {'Actors': ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], 'Number of movies': ["87", "53", "69"]}
->>> queries = ["What is the name of the first actor?", "How many movies has George Clooney played in?", "What is the total number of movies?"]
+>>> data = {"Actors": ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], "Number of movies": ["87", "53", "69"]}
+>>> queries = [
+...     "What is the name of the first actor?",
+...     "How many movies has George Clooney played in?",
+...     "What is the total number of movies?",
+... ]
 >>> table = pd.DataFrame.from_dict(data)
->>> inputs = tokenizer(table=table, queries=queries, padding='max_length', return_tensors="pt") 
+>>> inputs = tokenizer(table=table, queries=queries, padding="max_length", return_tensors="pt")
 >>> outputs = model(**inputs)
 >>> predicted_answer_coordinates, predicted_aggregation_indices = tokenizer.convert_logits_to_predictions(
-...         inputs, 
-...         outputs.logits.detach(), 
-...         outputs.logits_aggregation.detach()
+...     inputs, outputs.logits.detach(), outputs.logits_aggregation.detach()
 ... )

 >>> # let's print out the results:
->>> id2aggregation = {0: "NONE", 1: "SUM", 2: "AVERAGE", 3:"COUNT"}
+>>> id2aggregation = {0: "NONE", 1: "SUM", 2: "AVERAGE", 3: "COUNT"}
 >>> aggregation_predictions_string = [id2aggregation[x] for x in predicted_aggregation_indices]

 >>> answers = []
 >>> for coordinates in predicted_answer_coordinates:
-...   if len(coordinates) == 1:
-...     # only a single cell:
-...     answers.append(table.iat[coordinates[0]])
-...   else:
-...     # multiple cells
-...     cell_values = []
-...     for coordinate in coordinates:
-...        cell_values.append(table.iat[coordinate])
-...     answers.append(", ".join(cell_values))
+...     if len(coordinates) == 1:
+...         # only a single cell:
+...         answers.append(table.iat[coordinates[0]])
+...     else:
+...         # multiple cells
+...         cell_values = []
+...         for coordinate in coordinates:
+...             cell_values.append(table.iat[coordinate])
+...         answers.append(", ".join(cell_values))

 >>> display(table)
 >>> print("")
 >>> for query, answer, predicted_agg in zip(queries, answers, aggregation_predictions_string):
-...   print(query)
-...   if predicted_agg == "NONE":
-...     print("Predicted answer: " + answer)
-...   else:
-...     print("Predicted answer: " + predicted_agg + " > " + answer)    
+...     print(query)
+...     if predicted_agg == "NONE":
+...         print("Predicted answer: " + answer)
+...     else:
+...         print("Predicted answer: " + predicted_agg + " > " + answer)
 What is the name of the first actor?
 Predicted answer: Brad Pitt
 How many movies has George Clooney played in?
@@ -415,47 +462,49 @@ What is the total number of movies?
 Predicted answer: SUM > 87, 53, 69
 ===PT-TF-SPLIT===
 >>> from transformers import TapasTokenizer, TFTapasForQuestionAnswering
->>> import pandas as pd 
+>>> import pandas as pd

->>> model_name = 'google/tapas-base-finetuned-wtq'
+>>> model_name = "google/tapas-base-finetuned-wtq"
 >>> model = TFTapasForQuestionAnswering.from_pretrained(model_name)
 >>> tokenizer = TapasTokenizer.from_pretrained(model_name)

->>> data = {'Actors': ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], 'Number of movies': ["87", "53", "69"]}
->>> queries = ["What is the name of the first actor?", "How many movies has George Clooney played in?", "What is the total number of movies?"]
+>>> data = {"Actors": ["Brad Pitt", "Leonardo Di Caprio", "George Clooney"], "Number of movies": ["87", "53", "69"]}
+>>> queries = [
+...     "What is the name of the first actor?",
+...     "How many movies has George Clooney played in?",
+...     "What is the total number of movies?",
+... ]
 >>> table = pd.DataFrame.from_dict(data)
->>> inputs = tokenizer(table=table, queries=queries, padding='max_length', return_tensors="tf") 
+>>> inputs = tokenizer(table=table, queries=queries, padding="max_length", return_tensors="tf")
 >>> outputs = model(**inputs)
 >>> predicted_answer_coordinates, predicted_aggregation_indices = tokenizer.convert_logits_to_predictions(
-...         inputs, 
-...         outputs.logits, 
-...         outputs.logits_aggregation
+...     inputs, outputs.logits, outputs.logits_aggregation
 ... )

 >>> # let's print out the results:
->>> id2aggregation = {0: "NONE", 1: "SUM", 2: "AVERAGE", 3:"COUNT"}
+>>> id2aggregation = {0: "NONE", 1: "SUM", 2: "AVERAGE", 3: "COUNT"}
 >>> aggregation_predictions_string = [id2aggregation[x] for x in predicted_aggregation_indices]

 >>> answers = []
 >>> for coordinates in predicted_answer_coordinates:
-...   if len(coordinates) == 1:
-...     # only a single cell:
-...     answers.append(table.iat[coordinates[0]])
-...   else:
-...     # multiple cells
-...     cell_values = []
-...     for coordinate in coordinates:
-...        cell_values.append(table.iat[coordinate])
-...     answers.append(", ".join(cell_values))
+...     if len(coordinates) == 1:
+...         # only a single cell:
+...         answers.append(table.iat[coordinates[0]])
+...     else:
+...         # multiple cells
+...         cell_values = []
+...         for coordinate in coordinates:
+...             cell_values.append(table.iat[coordinate])
+...         answers.append(", ".join(cell_values))

 >>> display(table)
 >>> print("")
 >>> for query, answer, predicted_agg in zip(queries, answers, aggregation_predictions_string):
-...   print(query)
-...   if predicted_agg == "NONE":
-...     print("Predicted answer: " + answer)
-...   else:
-...     print("Predicted answer: " + predicted_agg + " > " + answer)    
+...     print(query)
+...     if predicted_agg == "NONE":
+...         print("Predicted answer: " + answer)
+...     else:
+...         print("Predicted answer: " + predicted_agg + " > " + answer)
 What is the name of the first actor?
 Predicted answer: Brad Pitt
 How many movies has George Clooney played in?