Lecture 03 – CS 189, Fall 2025

In this lecture, we will cover the basic machine learning lifecycle using a hands-on approach with scikit-learn. We will work through each stage of the machine learning lifecycle while also introducing standard machine learning tools and techniques. The machine learning lifecycle consists of four parts:

[Figure: diagram of the machine learning lifecycle]
In [1]:
import numpy as np 
import pandas as pd
import plotly.express as px
In [2]:
# Uncomment for HTML Export
import plotly.io as pio
pio.renderers.default = "notebook_connected"

The Learning Problem

Suppose we are launching a new fashion trading website where people can upload pictures of clothing they want to trade. We want to help posters identify the clothing in the images. Suppose we have some training data consisting of clothing pictures with labels describing the type of clothing (e.g., "dress", "shirt", "pants").

What data do we have?

  • Labeled training examples.

What do we want to predict?

  • The category label of the clothing in the images. We may want to predict other things as well.

How would we evaluate success?

  • We likely want to measure our prediction accuracy.
  • We may eventually want to improve accuracy on certain high-value classes.

Looking at the Data

A key step that is often overlooked in machine learning projects is understanding the data. This includes exploring the dataset, visualizing the data, and gaining insights into its structure and characteristics.

We will be using the Fashion-MNIST dataset, which is a (now) classic dataset of 28x28 grayscale images of articles of clothing.

Fashion-MNIST: a Novel Image Dataset for Benchmarking Machine Learning Algorithms. Han Xiao, Kashif Rasul, Roland Vollgraf. https://github.com/zalandoresearch/fashion-mnist

This is an alternative to the even more classic MNIST digits dataset, which contains images of handwritten digits.

The following block of code will download the Fashion-MNIST dataset and load it into memory.

In [3]:
# Fetch the Data
import torchvision
data = torchvision.datasets.FashionMNIST(root='data', train=True, download=True)

# Preprocess the data into numpy arrays
images = data.data.numpy().astype(float)
targets = data.targets.numpy() # integer encoding of class labels
class_dict = {i:class_name for i,class_name in enumerate(data.classes)}
labels = np.array([class_dict[t] for t in targets]) # raw class labels
n = len(images)

print("Loaded FashionMNIST dataset with {} samples.".format(n))
print("Classes: {}".format(class_dict))
print("Image shape: {}".format(images[0].shape))
print("Image dtype: {}".format(images[0].dtype))
print("Image 0:\n", images[0])
Loaded FashionMNIST dataset with 60000 samples.
Classes: {0: 'T-shirt/top', 1: 'Trouser', 2: 'Pullover', 3: 'Dress', 4: 'Coat', 5: 'Sandal', 6: 'Shirt', 7: 'Sneaker', 8: 'Bag', 9: 'Ankle boot'}
Image shape: (28, 28)
Image dtype: float64
Image 0:
 [[  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   1.   0.
    0.  13.  73.   0.   0.   1.   4.   0.   0.   0.   0.   1.   1.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   3.   0.
   36. 136. 127.  62.  54.   0.   0.   0.   1.   3.   4.   0.   0.   3.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   6.   0.
  102. 204. 176. 134. 144. 123.  23.   0.   0.   0.   0.  12.  10.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
  155. 236. 207. 178. 107. 156. 161. 109.  64.  23.  77. 130.  72.  15.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   1.   0.  69.
  207. 223. 218. 216. 216. 163. 127. 121. 122. 146. 141.  88. 172.  66.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   1.   1.   1.   0. 200.
  232. 232. 233. 229. 223. 223. 215. 213. 164. 127. 123. 196. 229.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0. 183.
  225. 216. 223. 228. 235. 227. 224. 222. 224. 221. 223. 245. 173.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0. 193.
  228. 218. 213. 198. 180. 212. 210. 211. 213. 223. 220. 243. 202.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   1.   3.   0.  12. 219.
  220. 212. 218. 192. 169. 227. 208. 218. 224. 212. 226. 197. 209.  52.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   6.   0.  99. 244.
  222. 220. 218. 203. 198. 221. 215. 213. 222. 220. 245. 119. 167.  56.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   4.   0.   0.  55. 236.
  228. 230. 228. 240. 232. 213. 218. 223. 234. 217. 217. 209.  92.   0.]
 [  0.   0.   1.   4.   6.   7.   2.   0.   0.   0.   0.   0. 237. 226.
  217. 223. 222. 219. 222. 221. 216. 223. 229. 215. 218. 255.  77.   0.]
 [  0.   3.   0.   0.   0.   0.   0.   0.   0.  62. 145. 204. 228. 207.
  213. 221. 218. 208. 211. 218. 224. 223. 219. 215. 224. 244. 159.   0.]
 [  0.   0.   0.   0.  18.  44.  82. 107. 189. 228. 220. 222. 217. 226.
  200. 205. 211. 230. 224. 234. 176. 188. 250. 248. 233. 238. 215.   0.]
 [  0.  57. 187. 208. 224. 221. 224. 208. 204. 214. 208. 209. 200. 159.
  245. 193. 206. 223. 255. 255. 221. 234. 221. 211. 220. 232. 246.   0.]
 [  3. 202. 228. 224. 221. 211. 211. 214. 205. 205. 205. 220. 240.  80.
  150. 255. 229. 221. 188. 154. 191. 210. 204. 209. 222. 228. 225.   0.]
 [ 98. 233. 198. 210. 222. 229. 229. 234. 249. 220. 194. 215. 217. 241.
   65.  73. 106. 117. 168. 219. 221. 215. 217. 223. 223. 224. 229.  29.]
 [ 75. 204. 212. 204. 193. 205. 211. 225. 216. 185. 197. 206. 198. 213.
  240. 195. 227. 245. 239. 223. 218. 212. 209. 222. 220. 221. 230.  67.]
 [ 48. 203. 183. 194. 213. 197. 185. 190. 194. 192. 202. 214. 219. 221.
  220. 236. 225. 216. 199. 206. 186. 181. 177. 172. 181. 205. 206. 115.]
 [  0. 122. 219. 193. 179. 171. 183. 196. 204. 210. 213. 207. 211. 210.
  200. 196. 194. 191. 195. 191. 198. 192. 176. 156. 167. 177. 210.  92.]
 [  0.   0.  74. 189. 212. 191. 175. 172. 175. 181. 185. 188. 189. 188.
  193. 198. 204. 209. 210. 210. 211. 188. 188. 194. 192. 216. 170.   0.]
 [  2.   0.   0.   0.  66. 200. 222. 237. 239. 242. 246. 243. 244. 221.
  220. 193. 191. 179. 182. 182. 181. 176. 166. 168.  99.  58.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.  40.  61.  44.  72.  41.  35.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]
 [  0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.
    0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.   0.]]

Understanding The Raw Features (Images)

How much data do we have?

In [4]:
images.shape
Out[4]:
(60000, 28, 28)

The images are stored in a 60000 by 28 by 28 tensor. This means we have 60000 images, each of which is 28 pixels wide and 28 pixels tall. Each pixel is represented by a single value. What are those values?

In [5]:
counts, bins =  np.histogram(images, bins=255)
fig_pixels = px.bar(x=bins[1:], y=counts,  title="Pixel value distribution", 
       log_y=True, labels={"x":"Pixel value", "y":"Count"})
fig_pixels

It is important to learn how to visualize and work with data. Here we use Plotly Express to visualize a single image. Note that we use the 'gray_r' color map, a reversed grayscale map in which 0 renders as white and larger pixel values render darker.

In [6]:
px.imshow(images[0], color_continuous_scale='gray_r') 

The following snippet of code visualizes multiple images in a grid. You are not required to understand this code, but it is useful to know how to visualize images in Python.

In [7]:
def show_images(images, max_images=40, ncols=5, labels = None):
    """Visualize a subset of images from the dataset.
    Args:
        images (np.ndarray): Array of images to visualize [img,row,col].
        max_images (int): Maximum number of images to display.
        ncols (int): Number of columns in the grid.
        labels (np.ndarray, optional): Labels for the images, used for facet titles.
    Returns:
        plotly.graph_objects.Figure: A Plotly figure object containing the images.
    """
    n = min(images.shape[0], max_images) # number of images to show
    px_height = 220 # height of each image in pixels
    fig = px.imshow(images[:n, :, :], color_continuous_scale='gray_r', 
                    facet_col = 0, facet_col_wrap=ncols,
                    height = px_height * int(np.ceil(n/ncols)))
    fig.update_layout(coloraxis_showscale=False)
    if labels is not None:
        # Extract the facet number and replace with the label.
        fig.for_each_annotation(lambda a: a.update(text=labels[int(a.text.split("=")[-1])]))
    return fig
In [8]:
show_images(images, 20, labels=labels)

Let's look at a few examples of each class. Here we use Pandas to group the images by label and sample 2 from each class. You are not required to know Pandas (we won't test you on it), but it is a useful library for data manipulation and analysis, and we will use it often in this course.

In [9]:
idx = (
    pd.DataFrame({"labels": labels})
      .groupby("labels", as_index=False)
      .sample(2)
      .index
      .to_numpy())
show_images(images[idx,:,:], labels=labels[idx])

Understanding the Labels

Now let's examine the labels. Are they discrete? What is the distribution? Are there missing values or errors?

In the Fashion-MNIST dataset, each image is labeled with a class corresponding to a type of clothing. There are 10 classes in total.

However, it is also important to understand the distribution of labels in the dataset. This can help us identify potential issues such as class imbalance, where some classes have significantly more samples than others.

In [10]:
labels
Out[10]:
array(['Ankle boot', 'T-shirt/top', 'T-shirt/top', ..., 'Dress',
       'T-shirt/top', 'Sandal'], shape=(60000,), dtype='<U11')

The labels are strings (discrete).

What is the distribution of labels?

In [11]:
px.histogram(labels, title="Label distribution")   

Each type of clothing appears in equal proportion. We don't have any missing values, since every label is one of the 10 classes (no blank or "missing" label values).

Most real-world datasets aren't this balanced or clean. In fact, it's common to see a long-tail distribution, where a few classes are very common and many classes are rare.
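As a quick numeric check of the class balance (a small sketch, equivalent to the histogram above), we can count the labels directly; in the Fashion-MNIST training split, each class appears 6,000 times.

In [ ]:
# Count how many images carry each label.
classes, counts = np.unique(labels, return_counts=True)
print(dict(zip(classes, counts)))  # expect 6000 per class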

Reviewing the Learning Setting

Having examined the data we can see that we have a large collection of pairs of features and categorical labels (with 10 classes). This is a supervised learning problem, where the goal is to learn a mapping from the input features (images) to the output labels (categories). Because the labels are discrete this is a classification problem.

It is also worth noting that because the input features are images this is also a computer vision problem. This means that when we get to the model development stage, we will need to consider techniques that are specifically designed for multi-class classification and in particular computer vision.





Return to Slides





Train-Test-Validation Split

We will split the dataset into a training set, a validation set, and a test set. The training set will be used to train the model, while the validation set will be used to tune the model's hyperparameters. The test set will be used to evaluate the model's performance.

Technically, the Fashion-MNIST dataset has a separate test set, but we will demonstrate how to split data in general.

In [12]:
# use sklearn to construct a train test split
from sklearn.model_selection import train_test_split
In [13]:
# Construct the train - test split
images_tr, images_te, labels_tr, labels_te = train_test_split(
    images, labels, test_size=0.2, random_state=42)

# Construct the train - validation split
images_tr, images_val, labels_tr, labels_val = train_test_split(
    images_tr, labels_tr, test_size=0.2, random_state=42)

print("images_tr shape:", images_tr.shape)
print("images_val shape:", images_val.shape)
print("images_te shape:", images_te.shape)
images_tr shape: (38400, 28, 28)
images_val shape: (9600, 28, 28)
images_te shape: (12000, 28, 28)
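Fashion-MNIST's classes are balanced, so a plain random split works fine here. For imbalanced datasets, it is common to pass train_test_split's stratify argument so that each split preserves the label proportions. A minimal sketch (the _s variable names are just for illustration):

In [ ]:
# Hypothetical stratified variant of the split above (not used in this lecture):
images_tr_s, images_te_s, labels_tr_s, labels_te_s = train_test_split(
    images, labels, test_size=0.2, random_state=42, stratify=labels)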





Return to Slides





Model Design

We have already loaded the Fashion-MNIST dataset in the previous section. Now, we will preprocess the data to make it suitable for training a classification model.

Feature Engineering

Feature Engineering is the process of transforming the raw features into a representation that can be used effectively by machine learning techniques. This will often involve transforming data into vector representations.

Naive Image Featurization

For this example we are working with low-resolution grayscale image data. Here we adopt a very simple featurization approach -- flatten the image. We will convert the 28x28 pixel images into 784-dimensional vectors.

In [14]:
images_tr.shape
Out[14]:
(38400, 28, 28)
In [15]:
def flatten(images):
    return images.reshape(images.shape[0], -1)
In [16]:
X_tr = flatten(images_tr)
In [17]:
X_tr.shape
Out[17]:
(38400, 784)

Standardization

Recall that the pixel intensities are from 0 to 255:

In [18]:
fig_pixels

Let's standardize the pixel intensities to have zero mean and unit variance: each pixel value x is mapped to (x - μ)/σ, where μ and σ are that pixel's mean and standard deviation computed over the training set.

Here we use the sklearn StandardScaler

In [19]:
from sklearn.preprocessing import StandardScaler

# 1. Initialize a StandardScaler object
image_scaler = StandardScaler()

# 2. Fit the scaler
image_scaler.fit(flatten(images_tr))
Out[19]:
StandardScaler()

What do the mean and variance images tell us about the dataset?

In [20]:
display(px.imshow(image_scaler.mean_.reshape(28,28), 
                  color_continuous_scale='gray_r', title="Mean image"))
display(px.imshow(image_scaler.var_.reshape(28,28), 
                  color_continuous_scale='gray_r', title="Variance image"))

Let's create a generic featurization function that we can reuse for the other splits of the data. Notice that this function uses the image_scaler that we fit to the training data; fitting the scaler only on the training set prevents information about the validation and test data from leaking into our features.

In [21]:
def featurizer(images):
    flattened = flatten(images)
    return image_scaler.transform(flattened)

X_tr = featurizer(images_tr)

Our new images look similar to the original images but they have been standardized to have zero mean and unit variance. This should help improve the performance of our machine learning models.

In [22]:
show_images(X_tr.reshape(images_tr.shape), max_images=10, labels=labels_tr)
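We can also verify the standardization numerically. A small sketch (note that constant pixels, such as the always-black corners, have zero variance and are simply left at zero by StandardScaler):

In [ ]:
# Sanity check: per-pixel means are ~0, and a central (varying) pixel has std ~1.
print(np.allclose(X_tr.mean(axis=0), 0))  # True, up to floating point error
print(X_tr[:, 28*14 + 14].std())          # ~1.0 for the center pixel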

One-Hot Encoding

We don't need to one-hot encode the features in this dataset so we will briefly demonstrate on another dataset:

In [23]:
df = pd.DataFrame({"color": ["red", "green", "red", "blue", "blue", "yellow", ""]})
df
Out[23]:
color
0 red
1 green
2 red
3 blue
4 blue
5 yellow
6
In [24]:
from sklearn.preprocessing import OneHotEncoder
# 1. Initialize a OneHotEncoder object
ohe = OneHotEncoder()
# 2. Fit the encoder
ohe.fit(df[["color"]])
Out[24]:
OneHotEncoder()
In [25]:
ohe.categories_
Out[25]:
[array(['', 'blue', 'green', 'red', 'yellow'], dtype=object)]
In [26]:
ohe.transform(df[["color"]]).toarray()
Out[26]:
array([[0., 0., 0., 1., 0.],
       [0., 0., 1., 0., 0.],
       [0., 0., 0., 1., 0.],
       [0., 1., 0., 0., 0.],
       [0., 1., 0., 0., 0.],
       [0., 0., 0., 0., 1.],
       [1., 0., 0., 0., 0.]])

Each row has a single 1 in the column corresponding to that row's category; note that the empty string was treated as a category of its own.

Bag of Words

We also don't need the bag-of-words representation for this dataset, but we will demonstrate it briefly using another dataset.

In [27]:
df['text'] = [
    "Red is a color.",
    "Green is for green food.",
    "Red reminds me of red food.",
    "Blue is my favorite color!",
    "Blue is for Cal!",
    "Yellow is also for Cal!",
    "I forgot to write something."
]
In [28]:
from sklearn.feature_extraction.text import CountVectorizer

# 1. Initialize a CountVectorizer object
vectorizer = CountVectorizer()

# 2. Fit the vectorizer
vectorizer.fit(df["text"])
Out[28]:
CountVectorizer()
In [29]:
pd.DataFrame(vectorizer.transform(df["text"]).toarray(), 
             columns=vectorizer.get_feature_names_out())
Out[29]:
also blue cal color favorite food for forgot green is me my of red reminds something to write yellow
0 0 0 0 1 0 0 0 0 0 1 0 0 0 1 0 0 0 0 0
1 0 0 0 0 0 1 1 0 2 1 0 0 0 0 0 0 0 0 0
2 0 0 0 0 0 1 0 0 0 0 1 0 1 2 1 0 0 0 0
3 0 1 0 1 1 0 0 0 0 1 0 1 0 0 0 0 0 0 0
4 0 1 1 0 0 0 1 0 0 1 0 0 0 0 0 0 0 0 0
5 1 0 1 0 0 0 1 0 0 1 0 0 0 0 0 0 0 0 1
6 0 0 0 0 0 0 0 1 0 0 0 0 0 0 0 1 1 1 0
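Once fit, the vectorizer reuses its learned vocabulary when transforming new text; words it has never seen are simply dropped. A quick sketch (the example sentence is made up):

In [ ]:
# "purple" is out of vocabulary, so only is/my/favorite/color are counted.
new_counts = vectorizer.transform(["Purple is my favorite color!"])
pd.DataFrame(new_counts.toarray(), columns=vectorizer.get_feature_names_out())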





Return to Slides





Modeling and Optimization

In this section, we will go through the modeling process. We will focus on developing a classification model.

Training (Fitting) a Classifier

We will start with the most basic classifier, the logistic regression model, to demonstrate the classification workflow.

Logistic regression is a linear model that is commonly used for binary and multi-class classification tasks. It is also a good starting point for understanding more complex deep learning models that will be covered later in the course.

Here we use sklearn to fit a logistic regression model to the training data. The LogisticRegression class from sklearn.linear_model is used to create an instance of the model.

The fit method is called on the model instance, passing in the training data and labels. This trains the model to learn the relationship between the input features (flattened images) and the target labels (clothing categories). In scikit-learn, the fit method is used to train any model on the provided data.

In [30]:
from sklearn.linear_model import LogisticRegression

lr_model = LogisticRegression()
lr_model.fit(X=X_tr, y=labels_tr)
/opt/homebrew/Caskroom/mambaforge/base/envs/py_3_11/lib/python3.11/site-packages/sklearn/linear_model/_logistic.py:470: ConvergenceWarning:

lbfgs failed to converge after 100 iteration(s) (status=1):
STOP: TOTAL NO. OF ITERATIONS REACHED LIMIT

Increase the number of iterations to improve the convergence (max_iter=100).
You might also want to scale the data as shown in:
    https://scikit-learn.org/stable/modules/preprocessing.html
Please also refer to the documentation for alternative solver options:
    https://scikit-learn.org/stable/modules/linear_model.html#logistic-regression

Out[30]:
LogisticRegression()

Notice that we get a warning that:

lbfgs failed to converge after 100 iteration(s) (status=1):
STOP: TOTAL NO. OF ITERATIONS REACHED LIMIT

This warning indicates that the optimization algorithm used by the logistic regression model did not converge to a solution within the default number of iterations. This can happen if the model is complex or if the data is not well-scaled.

We can change the optimization algorithm used by the logistic regression model. The default algorithm is lbfgs, which is a quasi-Newton method. Other options include newton-cg, sag, and saga. Each of these algorithms has its own strengths and weaknesses, and the choice of algorithm can affect the convergence speed and final performance of the model.

In this class, we will explore variations of stochastic gradient descent like saga. Let's try the saga algorithm instead of lbfgs to see if it converges faster. Here we also loosen the tol (convergence tolerance) parameter so that training finishes quickly.

In [31]:
lr_model = LogisticRegression(tol=0.05, solver='saga', random_state=42)
lr_model.fit(X=X_tr, y=labels_tr)
Out[31]:
LogisticRegression(random_state=42, solver='saga', tol=0.05)

Parameters

The parameters of a model are the internal variables that the model learns during the training process. For example, in logistic regression, the parameters are the weights assigned to each feature. These weights are adjusted during training to minimize the loss function, which measures how well the model's predictions match the actual labels.

In [32]:
print("model.coef_.shape:", lr_model.coef_.shape)
print("model.intercept_.shape:", lr_model.intercept_.shape)
print(lr_model.coef_)
print(lr_model.intercept_)
model.coef_.shape: (10, 784)
model.intercept_.shape: (10,)
[[ 9.90445492e-05 -6.36010321e-03 -3.85913757e-03 ...  1.49595978e-03
   4.32587736e-03  2.73064427e-03]
 [-1.89699677e-03  6.63981322e-03 -7.47402405e-03 ... -1.80362390e-02
  -1.84524048e-02 -1.52846533e-02]
 [-7.43264082e-04 -4.46484428e-03  1.60046019e-03 ...  5.50850058e-03
   1.38217724e-02  3.68772263e-03]
 ...
 [ 1.77951137e-04 -1.08447436e-03 -8.59128688e-04 ... -5.03797045e-03
  -1.78474348e-03 -2.49799352e-03]
 [-8.24675871e-03 -2.41366751e-03 -7.31344979e-03 ... -1.80925346e-02
  -1.21750176e-02 -1.40790500e-03]
 [-1.69500201e-04  7.44355526e-05 -5.08764217e-03 ... -5.67020645e-03
  -1.32036337e-03 -1.92847951e-03]]
[-0.03276315  0.01498156  0.02486191 -0.00368395  0.04477243 -0.06132416
  0.09267479 -0.03592529 -0.00330317 -0.04029096]

We can also visualize these coefficients. This can help us understand which pixels are most important for each class. We will learn more about this model in the future. (You don't have to understand these details now.)

In [33]:
coeffs = lr_model.coef_
show_images(coeffs.reshape(10, 28, 28), labels=lr_model.classes_)

Neural Networks

Neural networks are often the model of choice for image classification tasks. They can learn complex patterns in the data and often outperform simpler models like logistic regression. However, they require a well-chosen architecture, significant training data, and substantial computational resources.

Here we will try a simple neural network with two hidden layers.

In [34]:
from sklearn.neural_network import MLPClassifier
mlp = MLPClassifier(
    hidden_layer_sizes=(100, 50), 
    max_iter=100, tol=1e-3, random_state=42)

mlp.fit(X=X_tr, y=labels_tr)
Out[34]:
MLPClassifier(hidden_layer_sizes=(100, 50), max_iter=100, random_state=42,
              tol=0.001)
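As a quick sanity check, we can compute the network's accuracy on the validation split and later compare it against the logistic regression model. A small sketch (output not shown):

In [ ]:
# Hypothetical quick check: validation accuracy of the trained MLP.
print(np.mean(mlp.predict(featurizer(images_val)) == labels_val))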

Hyperparameters

The hyperparameters are the arguments that are set before the training process begins. These include the choice of optimization algorithm, the learning rate, and the number of iterations, among others. Hyperparameters are typically tuned using techniques like cross-validation to find the best combination for a given dataset.

Confusingly, these hyperparameters are often referred to as "parameters" in the context of machine learning libraries like sklearn. For example, the LogisticRegression class has hyperparameters like solver, C, and max_iter that can be adjusted to improve model performance.
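scikit-learn can automate this kind of tuning with tools like GridSearchCV, which cross-validates every combination in a parameter grid. A minimal sketch (the grid values are illustrative, and we fit on a small subset for speed):

In [ ]:
from sklearn.model_selection import GridSearchCV

# Cross-validated search over the regularization strength C.
search = GridSearchCV(
    LogisticRegression(tol=1e-3, random_state=42),
    param_grid={"C": [0.01, 0.1, 1.0]},
    cv=3)
search.fit(X_tr[:1000], labels_tr[:1000])
print(search.best_params_, search.best_score_)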

In [35]:
lr_model
Out[35]:
LogisticRegression(random_state=42, solver='saga', tol=0.05)

To evaluate the model we will use the validation dataset.

In [36]:
X_val = featurizer(images_val)

Let's try tuning the regularization parameter C. To make this process more illustrative, we will work with a smaller subset of the training data (n=1000). This will allow us to better demonstrate underfitting and overfitting and significantly speed up the training process.

In [37]:
n_small = 1000
X_tr_small = X_tr[:n_small,:]
labels_tr_small = labels_tr[:n_small]

In practice, we need to be careful when tuning regularization parameters on a sample of the data: smaller datasets typically need more regularization to prevent overfitting, so the best setting found here may differ from the best setting for the full training set.

In [38]:
from sklearn.metrics import log_loss

C_vals = np.logspace(-5, 1, 20)

logprob_tr = []
logprob_val = []
acc_tr = []
acc_val = []

for C in C_vals:
    print("starting training with C =", C)
    model = LogisticRegression(tol=1e-3, random_state=42, C=C)
    model.fit(X=X_tr_small, y=labels_tr_small)
    
    # compute the average log probability (negative log loss)
    logprob_tr.append(-log_loss(labels_tr_small, model.predict_proba(X_tr_small), labels=model.classes_))
    logprob_val.append(-log_loss(labels_val, model.predict_proba(X_val), labels=model.classes_))

    # compute the accuracy
    acc_tr.append(np.mean(model.predict(X_tr_small) == labels_tr_small))
    acc_val.append(np.mean(model.predict(X_val) == labels_val))
starting training with C = 1e-05
starting training with C = 2.06913808111479e-05
starting training with C = 4.281332398719396e-05
starting training with C = 8.858667904100833e-05
starting training with C = 0.00018329807108324357
starting training with C = 0.000379269019073225
starting training with C = 0.0007847599703514606
starting training with C = 0.001623776739188721
starting training with C = 0.003359818286283781
starting training with C = 0.0069519279617756054
starting training with C = 0.01438449888287663
starting training with C = 0.029763514416313162
starting training with C = 0.06158482110660261
starting training with C = 0.1274274985703132
starting training with C = 0.26366508987303555
starting training with C = 0.5455594781168515
starting training with C = 1.1288378916846884
starting training with C = 2.3357214690901213
starting training with C = 4.832930238571752
starting training with C = 10.0
In [39]:
df_logprob = pd.DataFrame({
    "C_val": C_vals, 
    "Train": logprob_tr, "Validation": logprob_val,
}).set_index("C_val") 

display(
    px.line(df_logprob, 
        labels={"value": "Avg. Log Prob.", "C_val": "Reg. Parameter C"},
        title="LR Classifier Log Prog vs Reg. Parameter",
        markers=True,
        log_x=True,
        width=800, height=500)
)

df_acc = pd.DataFrame({
    "C_val": C_vals, 
    "Train": acc_tr, "Validation": acc_val
}).set_index("C_val") 

display(
    px.line(df_acc, 
        labels={"value": "Accuracy", "C_val": "Reg. Parameter C"},
        title="LR Classifier Accuracy vs Reg. Parameter",
        markers=True,
        log_x=True,
        width=800, height=500
    )
)

Evaluating the Model

After training the model, we can use it to make predictions on new data. The predict method of the trained model is used to generate predictions based on the input features.

Let's return to our logistic regression model.

In [40]:
lr_model.predict(X_tr[:10,:])
Out[40]:
array(['Ankle boot', 'Coat', 'Ankle boot', 'T-shirt/top', 'Pullover',
       'Ankle boot', 'Dress', 'T-shirt/top', 'Coat', 'Sandal'],
      dtype='<U11')

Do you agree with the predictions? Let's visualize the predictions on a few training images.

In [41]:
show_images(images_tr[:10,:].reshape(10, 28, 28),
            labels = lr_model.predict(X_tr[:10,:]))

Now let's see what the correct labels are for these images.

In [42]:
k = 10
tmp_labels = labels_tr[:k] + " (pred=" + lr_model.predict(X_tr[:k,:]) + ")"
show_images(images_tr[:k,:].reshape(k, 28, 28), labels=tmp_labels)

Predicting Probabilities

Many models can also provide probabilities for each class using the predict_proba method. This is useful for understanding the model's confidence in its predictions. In this class, we will often use a probabilistic framing, where we interpret the output of the model as probabilities of each class.

In [43]:
lr_model.predict_proba(X_tr[:5,:])
Out[43]:
array([[9.51642010e-01, 1.25766964e-03, 8.94327054e-07, 3.11486837e-07,
        2.59469407e-07, 7.35306052e-03, 1.78581053e-07, 3.97435123e-02,
        5.22696365e-07, 1.58056694e-06],
       [1.05752334e-04, 2.47086595e-03, 8.32072100e-01, 3.44094506e-03,
        4.58904789e-02, 4.24209010e-05, 1.13951633e-01, 1.94167275e-05,
        1.55456636e-03, 4.51820449e-04],
       [9.30078717e-01, 1.40564685e-03, 1.91994009e-06, 6.84403412e-07,
        8.73522603e-07, 9.24863395e-03, 8.71969951e-07, 5.92557003e-02,
        1.75317539e-06, 5.19911487e-06],
       [2.05798117e-04, 2.21031435e-05, 6.61559787e-04, 2.37402967e-02,
        2.18046824e-02, 2.07214721e-05, 3.03973688e-02, 1.53740432e-04,
        9.18742226e-01, 4.25150290e-03],
       [2.23839377e-04, 9.60149725e-02, 1.08016253e-01, 2.85455925e-04,
        7.19252331e-01, 1.85483941e-03, 7.24570316e-02, 3.23939232e-04,
        1.53916187e-03, 3.21759981e-05]])
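For a linear model like this one, predict_proba is just a softmax over the linear scores computed from the learned parameters. A small sketch verifying this (assuming the multinomial/softmax formulation that scikit-learn uses for multi-class logistic regression):

In [ ]:
# Recover predict_proba from coef_ and intercept_ via softmax.
logits = X_tr[:5] @ lr_model.coef_.T + lr_model.intercept_   # (5, 10) class scores
logits -= logits.max(axis=1, keepdims=True)                  # numerical stability
probs = np.exp(logits) / np.exp(logits).sum(axis=1, keepdims=True)
print(np.allclose(probs, lr_model.predict_proba(X_tr[:5])))  # expect True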

We can visualize these probabilities for the same images we predicted earlier.

In [44]:
k = 10
df = pd.DataFrame(lr_model.predict_proba(X_tr[:k,:]), columns=lr_model.classes_)
bars = px.bar(df, barmode='stack', orientation='v')
bars.update_layout(xaxis_tickmode='array', xaxis_tickvals=np.arange(k))
display(bars)
tmp_labels = labels_tr[:k] + " (pred=" + lr_model.predict(X_tr[:k,:]) + ") img: " + np.arange(k).astype(str)
show_images(images_tr[:k,:].reshape(k, 28, 28), labels=tmp_labels)

Accuracy Metrics and Test Performance

After training the model, we often want to evaluate the model. There are many ways to evaluate a model, and the best method depends on the task and the data. For classification tasks, we often use metrics like accuracy, precision, recall, and F1-score. Let's start with accuracy.

Accuracy is the simplest metric: it measures the proportion of correct predictions out of the total number of predictions.

Let's start by computing the accuracy of our model on the training set.

In [45]:
np.mean(lr_model.predict(X_tr) == labels_tr, axis=0)
Out[45]:
np.float64(0.8488541666666667)

One issue with evaluating on the training set is that the model may have overfit to the training data, meaning it performs well on the training set but poorly on unseen data. Intuitively, this is like practicing on a set of questions and then getting those same questions right on a test, but not being able to answer new questions that are similar but not identical.

To assess the model's performance on unseen data, we will evaluate it on the test set. Recall that the test set is a separate portion of the dataset that was not used during training.

In [46]:
X_te = featurizer(images_te)
In [47]:
np.mean(lr_model.predict(X_te) == labels_te, axis=0)
Out[47]:
np.float64(0.84075)
In [48]:
from sklearn.metrics import accuracy_score

train_acc = accuracy_score(labels_tr, lr_model.predict(X_tr))
val_acc = accuracy_score(labels_val, lr_model.predict(X_val))
test_acc = accuracy_score(labels_te, lr_model.predict(X_te))

print("Train accuracy:", train_acc)
print("Validation accuracy:", val_acc)
print("Test accuracy:", test_acc)
Train accuracy: 0.8488541666666667
Validation accuracy: 0.849375
Test accuracy: 0.84075

The test accuracy is slightly lower than the training accuracy, which is expected. However, the difference is not too large, indicating that the model has not overfit significantly.

Is this accuracy good? What would a random guess yield?

A common way to evaluate a classification model is to compare its accuracy against a baseline. Perhaps the simplest baseline is random guessing, where we randomly assign a class to each image.

What accuracy does random guessing yield?

This depends on how frequently each class appears in the dataset. With 10 balanced classes, random guessing should be correct about 10% of the time.

In [49]:
np.random.seed(42)
print("Model Accuracy:", np.mean(lr_model.predict(X_val) == labels_val, axis=0))
print("Random Guess Accuracy:", 
      np.mean(np.random.choice(lr_model.classes_, size=len(labels_te)) == labels_te, axis=0))
Model Accuracy: 0.849375
Random Guess Accuracy: 0.10108333333333333

Does our model struggle with any particular class?

In [50]:
isWrong = lr_model.predict(X_val) != labels_val
# histogram of the incorrect predictions, broken down by true label
fig = px.histogram(labels_val[isWrong], histnorm='percent')
fig.update_layout(xaxis_title="Label", 
                  yaxis_title="Percentage of Incorrect Predictions")
fig.update_xaxes(categoryorder="total descending")

For classification tasks, we often want to look at more than just accuracy. We can use a confusion matrix to visualize the performance of the model across different classes. The confusion matrix shows the number of correct and incorrect predictions for each class.

In [51]:
from sklearn.metrics import confusion_matrix

fig = px.imshow(
    confusion_matrix(labels_val, lr_model.predict(X_val)), 
    color_continuous_scale='Blues'
    )
fig.update_layout(
        xaxis_title="Predicted Label",
        yaxis_title="True Label",
        coloraxis_showscale=False,
        xaxis=dict(tickmode='array', tickvals=np.arange(len(lr_model.classes_)), ticktext=lr_model.classes_),
        yaxis=dict(tickmode='array', tickvals=np.arange(len(lr_model.classes_)), ticktext=lr_model.classes_)
    )   
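Beyond the confusion matrix, scikit-learn's classification_report summarizes the per-class precision, recall, and F1-score mentioned earlier. A quick sketch on the validation set:

In [ ]:
from sklearn.metrics import classification_report
print(classification_report(labels_val, lr_model.predict(X_val)))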

Last Thoughts

In the homework, you will have a chance to work with this data and use scikit-learn in more depth. We recommend reading the documentation and tutorials on the scikit-learn website as we go through the course. They are a great resource for understanding the library's functions and capabilities, as well as the underlying machine learning concepts.