-
Notifications
You must be signed in to change notification settings - Fork 0
/
thesis.tex
8516 lines (7457 loc) · 455 KB
/
thesis.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
%% In .emacs: (savehist-mode 1)
%% pdflatex thesis.tex &> /dev/null; bibtex thesis &> /dev/null; pdflatex thesis.tex &> /dev/null
\documentclass[phd,ianc,twoside]{infthesis}
\usepackage{graphicx}
\usepackage{natbib}
\usepackage{amsmath}
\usepackage{siunitx}
\usepackage{pdfpages}
\usepackage{amsbsy}
% Used to table in TCAL chapter
\usepackage{multirow,bigdelim}
\usepackage{array}
\usepackage{amssymb}
\usepackage{color}
\usepackage{hyperref}
% Make notes
\usepackage{xargs}
\usepackage{todonotes}
\usepackage{mathtools}
% Lancet component table
\usepackage{tabularx}
% Used to define \tbf
\usepackage{bold-extra}
\newcommand{\chapquote}[3]{\begin{quotation} \textit{#1} \end{quotation} \begin{flushright} - #2, \textit{#3}\end{flushright} }
% Lancet table colors
\definecolor{txtwhat}{rgb}{0.988,0.31,0.31}
\definecolor{txthow}{rgb}{0.11,0.6,0.11}
\definecolor{txtwhere}{rgb}{0.31,0.31,0.988}
\definecolor{darkG}{rgb}{0,0.6,0}
\definecolor{darkR}{rgb}{0.6,0,0}
\definecolor{darkY}{rgb}{0.8,0.6,0}
\newcommandx{\TODO}[2][1=]{\todo[backgroundcolor=red!25,inline]{TODO: #2}}
\newcommandx{\KEY}[2][1=]{\todo[backgroundcolor=yellow!25,inline]{KEY: #2}}
\newcommandx{\QUERY}[2][1=]{\todo[backgroundcolor=green!25,inline]{QUERY: #2}}
\newcommand{\tbf}[1]{\texttt{\textbf{#1}}}
%% Stated word count in intention to submit: 60k
%% TODO: Send thesis to Cyril
%% Information about the title, etc.
\title{Spatiotemporal properties of evoked neural response in the primary visual cortex}
\author{Jean-Luc Richard Stevens}
%% Optionally, specify the graduation month and year:
% \graduationdate{February 1786}
\abstract{
How is the visual world represented in the primary visual cortex of the
primate visual system? When a novel visual stimulus is projected onto
the retina, a complex, dynamic pattern of neural activity is evoked
across the cortical surface. Understanding the spatiotemporal properties
of this activity is a fundamental problem in neuroscience and it
requires a unified framework to bridge the gap from single neuron
activity to the response of the population as a whole.
The evoked cortical response of an individual neuron is determined
not only by the particular properties of a visual stimulus and the
internal response properties of the cell, but by the collective
dynamics of an entire network of interconnected neurons. On longer
timescales, this network structure is itself shifting as
activity-dependent plasticity gradually shapes the connectivity
between the cells as they respond to the visual environment.
The response of a single cortical neuron is then the outcome of an
extended spatiotemporal history of the activity across an entire
population, driven by the interplay between the neural activity
itself and the plasticity of the network on short and long
timescales. These interlocking processes shape the cortical response
and the cortical structure in relation to the short-term and
long-term history of visual input. In order to untangle this
complexity it is useful to build simplified computational models
that incorporate the essential features of these interactions.
The approach taken here is to bring these interlocking processes
together in a single, unified spatiotemporal model of cortical
activity. The aim is to relate the response of individual units to
the response dynamics of the entire, spatially extended population
while simultaneously bridging the gap from transient activity
responses to the long-term development of the network
structure. This attempt to unify broad spatial and temporal scales
is novel and requires a synthesis that spans experimental and
modeling approaches that are normally considered in isolation.
This thesis starts with background material describing how the early
visual system is organized, together with a description of how
neurons in the mammalian primary visual cortex develop their basic
response properties. This is followed by a review of the relevant
experimental data as well and a summary of relevant computational
modeling work. This chapter covers the experimental and modeling
literature regarding the electrical activity of single cells, the
spatiotemporal response patterns observed across the cortical
surface, and concludes by describing the emergence of feature
selectivity across the cortical surface over development.
Following the background chapter, an important part of the research
process itself is addressed, namely the need for an exploratory,
yet reproducible workflow. Easy exploration of high-dimensional data
is vital when validating large computational models as it is
necessary to explore the space of model behavior and check that the
necessary experimental constraints are satisfied. A new, general, and
reproducible workflow is established in order to ensure that the
scientific work presented in this thesis can be understood and used
by future researchers in an extensible and maintainable manner.
Using these research tools, the task of bridging spatial and
temporal scales is split into three distinct steps that are each
assigned to a corresponding results chapter. The first of these
chapters is an account of how the evoked response observed at the
level of a single neuron relates to the overall population
dynamics. The simple model presented aims to relate single-unit
responses recorded using electrophysiology to the population
response observed with optical imaging. Only data recorded in mature
animals on short timescales is considered, allowing the network
structure to be treated as static. The resulting model is the first
to show how realistic single-unit responses can add up to the very
different population-level evoked responses measured using
voltage-sensitive-dye imaging over large cortical areas.
Next we turn to modeling how cortical structure self-organizes over
slower developmental timescales into smooth orientation maps over
the cortical surface. In order to properly evaluate developmental
map models, a novel, automated map quality metric is presented that
allows simulated maps to be quantitatively compared to
experimentally recorded orientation maps across different mammalian
species. This metric is used to analyze the components of the GCAL
developmental model that forms the basis for the model presented in
the final results chapter.
In the last results chapter, these threads are tied together into a
developmental model that incorporates a more realistic model of
time, including calibrated transient neural response as well as
orientation map formation. The resulting unified model demonstrates
how neural response in the mammalian primary visual cortex for large
cortical populations may be accounted for by a simple model that
bridges millisecond timescales to the developmental timescales
necessary for the emergence of feature preferences.
}
\begin{document}
\begin{preliminary}
\maketitle
\begin{acknowledgements}
First of all, I give my sincere thanks to my first supervisor, James
A. Bednar (Jim) for his tireless help and support over the past five
years. He has consistently provided me with guidance and encouragement
and has shown an immense amount of patience. I would also like to thank
my second supervisor, Fr\'{e}d\'{e}ric Chavane (Fredo) for his crucial
scientific insights, and for inviting me to his lab in Marseille.
I would like to acknowledge all the members of the Institute for
Adaptive and Neural Computation for providing a supportive academic
environment and I would especially like to thank Peggy Seri\`{e}s for
her useful feedback at our yearly review meetings. A special thanks to
the Neuroinformatics DTC for offering a flexible and engaging PhD
program.
Thanks to Philipp R\"{u}diger for the many interesting and helpful
discussions we have had and particularly, for our close collaboration on
our software projects. I would like to thank my colleagues and friends,
Nikos Gekas, Duncan Carmichael, and Robert Court for so many enjoyable
conversations over our write-up lunches.
Finally, I am most grateful to my Mum and Dad for their support and for
allowing me to stay with them over the last stages of my project.
\end{acknowledgements}
\standarddeclaration
\tableofcontents
%% List of figures or tables
% \listoffigures
% \listoftables
\end{preliminary}
%% \TODO{UPDATE ABSTRACT. Fill in the necessary forms again. Submit with USB sticks.}
%% \TODO{Wrap all of SIRD, CGCAL, TCAL, GCAL in mboxes?}
\chapter{Introduction}
\label{chapter:introduction}
The brain is an information-processing organ that integrates sensory
information and controls behavior. In higher mammals, a significant
portion of this function is directed by the cerebral cortex, the outer
few millimeters of brain tissue composed of billions of neurons and
trillions of synaptic connections. The cerebral cortex is known to be
highly adaptable, and the neural responses within it are associated with
a diverse set of faculties, including executive function, motor control,
and sensory processing. Of all the cortical areas, the primary visual
area (V1) is perhaps the most well studied.
Visually evoked activity in primary visual cortex arises due to
interactions between a visual stimulus and the corresponding
neural substrate. This neural tissue is defined by an extended network of
cells that are richly interconnected, with connectivity patterns that
are neither entirely genetically predetermined nor entirely
random. Instead, much of the adaptability of the cortex and its
connectivity patterns are grounded in a slow, ongoing learning process.
Much of this learning is activity driven, mapping each evoked activity
response to tiny synaptic changes in the network which are then
projected onto future evoked responses. This process suggests how the cortex is
able to functionally adapt and perform useful computations: it
engages in a continual learning process that collects information about
the structure of the environment while simultaneously responding to
it. It is this interaction between environment, neural structure, and
evoked response that defines the process of vision as well as many of
the other faculties of the neocortex.
This overall theoretical picture is supported by a vast scientific
literature, with strong evidence supporting each piece of the
puzzle. For instance, recording cortical activity in response to a
visual stimulus is one of the core activities in experimental visual
neuroscience. The assumption that this activity reflects the
integration of incoming activity across synapses is one of the central
dogmas of the field. Indeed, much of visual neuroscience is concerned with
understanding how the activity evoked by a visual stimulus is
integrated by neurons across their synapses.
An equally substantial literature is concerned with how neurons and
synapses change over time. As outlined in Chapter \ref{chapter:background},
the idea that the synaptic structure of the
cortical network is plastic and shaped through learning processes is
supported by decades of experimental work. In primary visual cortex, the
functional and structural properties of the neural tissue have been
manipulated by modifying the long term visual statistics of the
environment using dark rearing, monocular deprivation, and goggle rearing
paradigms. These types of experiments are extremely difficult, involving
long-running experiments that span the critical periods of
development as the animal matures.
The time and expense of performing chronic experiments,
especially for primates, has resulted in a clear divide in the
scientific literature. On one hand, there is an extensive literature
focused on the properties of the evoked activity, typically concerned
with recording the response of neurons in the adult animal. On the
other, there is a sparser developmental literature, featuring chronic
experiments that record how neural responses change as the organism
matures. Both these literatures contribute important insights to our
understanding of the neural basis of vision.
One unfortunate consequence of this split is that theoretical frameworks
are divided along similar lines. It is clearly important for theory to make
contact with experiments, which helps explain this symmetry between theory
and experiment. Yet given the general lack of overarching theories in
neuroscience, and given what we do know about cortex and its functional
properties, there is a clear need for suitable theoretical frameworks
that can close this gap.
What computational models offer are a way to gain new insights into the
process of vision by connecting theory to experiment, allowing
different sources of experimental data to be integrated into a cohesive
whole. Models can make unstated assumptions explicit and can help
illuminate key principles. Ideally, by applying the right
simplifications, a model can help cut through overwhelming biological
complexity to suggest which of the many observations about a system are
crucial for a given result. So far, however, models have not
attempted to bridge the gap between the experimental data measuring
evoked response over tens or hundreds of milliseconds, and
experimental data that probes the developmental process over time
scales of days or weeks.
To cover such a broad span of time on practical computing systems,
such a model cannot also include a detailed account of each cell's intrinsic
properties as well as the detailed biophysics of their
connectivity. What such a unified model \emph{can} offer is the big picture,
allowing different types of experiment to be related to each other
within a single theoretical framework. If we can establish how the
primary visual cortex works at a coarse, general level, it will be
possible to add specific details as necessary, by using new experimental
data to constrain model parameters and making use of improved
computational resources to run bigger, more detailed simulations.
Thus the models in this thesis will focus on simulating firing rates
rather than individual neural spikes.
Building a framework that account for how neurons respond within a
large, extended population timescales covering from milliseconds to
weeks is no easy task. The purpose of this thesis is to demonstrate is
that this problem can be tackled in a meaningful, extensible way that
opens up exciting new lines of scientific enquiry.
\section{Aims and structure}
\label{section:Aims}
The aim of this thesis is to build a modeling framework that can
simulate the evoked response of a spatially extended population of
neurons in the primary visual cortex within an appropriate context. The
context relevant to a visual neuron spans at least three different
levels: (1) the evoked response of the neuron itself, along with the immediate
response properties of the surrounding neural population and their
connectivity to that particular neuron, (2) the history of spatiotemporal
activity across the network that explains how this specific connectivity
pattern arose, and (3) the long-term statistics of the visual environment,
which shapes this connectivity and gives a neural response the context
necessary to convey meaningful information about the visual world.
In addition to these primary aims, a core goal is to make this model
simple, understandable, and extensible. Creating a general framework is
only useful if it opens up new possibilities for answering research
questions posed by other scientific researchers. Simplicity and
reproducibility are two aims that do not target specific scientific
results but do target something equally, if not more important, namely
the scientific process itself.
This thesis has the following chapters, structured in a way designed
to bridge two very different forms of computational modeling in a
simple, reproducible, and understandable way:
\begin{description}
\item[Chapter 2] The Background chapter starts with a description of
different modeling approaches and their relation to each other, with
special attention to developmental modeling approaches. This is
followed by the anatomical background and then the background
information regarding the key models and experimental data referred to
throughout the rest of the thesis. This material is split between
material that accounts for the evoked response properties of neurons
and material that concerns cortical development; unfortunately there
is very little intersection between the two.
\item[Chapter 3] This chapter discusses the importance of scientific
reproducibility and introduces Lancet and HoloViews, two new open-source
Python-programming tools developed during this thesis project that greatly assist
scientific productivity, reproducibility, and communication within a
literate programming environment. The chapter focuses on how these
tools were used to enable the scientific work presented in this
thesis, but they are also very powerful in general, and actively
used by researchers across different disciplines, worldwide.
\item[Chapter 4] This chapter introduces the SIRD model, which links
single unit, firing-rate responses generated by the well-validated IRD
model to the corresponding population response as observed with
voltage-sensitive--dye imaging (VSDI). This model has a very simple
mathematical formulation that incorporates extensive calibration
against available experimental data. It is the first model of the
spatiotemporal VSDI response that accounts for the mechanisms involved
in relating single-unit activity to the bulk population response.
\item[Chapter 5] This chapter analyzes and validates a self-organizing
map model called GCAL, which unlike the SIRD model accounts for
developmental processes and includes a mechanistic subcortical
pathway. A new map-quality metric is introduced, which was used to
complete the analysis needed to validate this model. This led to the
publication of the GCAL model, which is simpler, more biologically
plausible, and more robust than its predecessors. This analysis is used
again in the rest of the thesis and GCAL is the basis of the final
TCAL model presented in the following chapter.
\item[Chapter 6] This chapter further simplifies GCAL while improving
the way it processes temporal events to make it more suitable for
modeling evoked response properties, resulting in an approximately
equivalent model called CGCAL. CGCAL, in turn, is used to build a new,
temporally calibrated model called TCAL. TCAL features plausible
firing rate profiles on the timescale of the evoked response, as well
as self-organization of connectivity on the timescale of
development. TCAL is analyzed using the map metric introduced in the
previous chapter and it is demonstrated that this model links to the
SIRD model discussed in the fourth chapter, providing a mechanistic
implementation of a developmental process that leads to the type of
processing supported by SIRD.
\item[Chapter 7] This chapter discusses the overall results from the
thesis, putting them into context, and suggests various possible directions for
future work. The intention is to provide suggestions for exciting new
research projects that can build on the framework that is developed in
this thesis.
\item[Chapter 8] The final chapter provides a short conclusion intended to
summarize the main contributions of this work.
\item[Appendix] For the convenience of the reader, this section
includes three papers relating to this work
that were published over the course of this project.
\end{description}
Another way of understanding the structure of the thesis as well as the
relationship between the various models provided is using the
breakdown in Table \ref{table:Model_features}. This table lists the
models in the order they are presented, including a breakdown of their
various key features. What is meant by each feature listed will be made
clear in Chapter \ref{chapter:background}. What is important to note is
that the SIRD model extends the IRD model, and that the final TCAL
builds on the CGCAL model which in turn builds on the GCAL model.
\newcolumntype{L}[1]{>{\raggedright\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
\newcolumntype{C}[1]{>{\centering\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
\newcolumntype{R}[1]{>{\raggedleft\let\newline\\\arraybackslash\hspace{0pt}}m{#1}}
\newcommand{\yes}{\textcolor{darkG}{\checkmark}}
\newcommand{\no}{\textcolor{darkR}{\text{\sffamily x}}}
\newcommand{\maybe}{\textcolor{darkY}{\text{\bf \sffamily !}}}
\begin{table}
\center
\hspace{-1em}
\begin{tabular}{|L{6.3cm}|c|c|c|c|c|l}
\cline{2-6}
\multicolumn{1}{c|}{} & \it{IRD} & \it{SIRD} & {\it GCAL} & \it{CGCAL} & \it{TCAL} \\
\cline{1-6}
Simulation of several mm$^2$ of cortex & \no & \yes & \yes & \yes & \yes & \rdelim\}{6}{3mm}[Development] \\
\cline{1-6}
Mechanistic subcortical pathway & \no & \no & \yes & \yes & \yes & \\
\cline{1-6}
Orientation maps & \no & \no & \yes & \yes & \yes \\
\cline{1-6}
Encodes first-order visual statistics & \no & \no & \yes & \yes & \yes\\
\cline{1-6}
Specific lateral connectivity & \no & \no& \yes & \yes & \yes \\
\cline{1-6}
Diversity of tuning properties & \no & \no & \yes & \yes & \yes \\
\cline{1-6}
\emph{Continuous model of time} & \yes & \yes & \no & \yes & \yes &\rdelim\}{3}{3mm}[Evoked]\\
\cline{1-6}
\emph{Plausible firing rate profiles} & \yes & \yes & \no & \no & \yes \\
\cline{1-6}
\emph{Calibrated against VSDI data} & \no & \yes & \no & \no & \no \\
\cline{1-6}
\end{tabular}
\caption{{\bf Key features of the five rate-based models in the order
they are presented in this thesis.} The IRD model is described in
Chapter \ref{chapter:background} as a way of summarizing the firing
rate properties of individual neurons. Next, the SIRD model is
introduced in Chapter \ref{chapter:SIRD}, extending the IRD model to
model the response of a spatially extended population of neurons. In
Chapter \ref{chapter:GCAL}, the focus switches to the developmental
process using a model called GCAL, simulating a spatially extended
population of neurons over long timescales. In Chapter
\ref{chapter:GCAL}, this model is adapted to operate on a continuous
timebase to define the CGCAL model. Lastly, a temporally calibrated
version of CGCAL called TCAL is constructed which shows how a
mechanistic, developmental model can be connected back to the SIRD
model. As TCAL inherits many of its properties from the GCAL model,
the main focus of this thesis is driven by the features relating to
the evoked response, indicated in the italic font.}
\label{table:Model_features}
\end{table}
The goal of the final TCAL model is to demonstrate how firing-rate
models can connect the response profiles of single units in the evoked
response to the structural changes that occurs across large populations
of neurons in the primary visual cortex over long, developmental time
periods. This framework is designed to be simple and extensible, and it
is hoped that future researchers will use TCAL as a platform to pose
new and groundbreaking research questions that could not be tackled
using existing computational modeling approaches.
\chapter{Background}
\label{chapter:background}
The goal of the final model presented in this thesis is to integrate a
wide range of theoretical and experimental findings into a single
mechanistic framework. In order to assess the validity of any
computational model it is necessary to understand its structure,
behavior, and overall scope. This chapter aims to cover the
relevant literature necessary to understand the work presented in later
chapters.
The structure of a model may be understood at a mathematical or
algorithmic level and for mechanistic models, biological plausibility
should also be evaluated. The behavior of a model may be assessed in relation
to experimental measurements used to reveal the functional dynamics of
the biological system. Which set of experimental constraints are
appropriate for assessing a model's plausibility are determined by its
intended scope.
This chapter starts with a brief overview of four different types of
cortical computational modeling approaches, followed by an overview of
the relevant anatomy of the early primate visual system. This data will be
used to justify the structural components of the models presented in
subsequent chapters. The rest of this chapter outlines the relevant
experimental findings and related theoretical concepts that will be
referred to later on in the thesis. Data recorded from macaque monkey
will be presented where possible, since this is the species that will
be targeted for modeling, but data from other species will be
considered for the many cases when macaque data is not available.
% Chronic 2-photon from Fitzpatrick lab can do it, but not in primate so far
Note that no single experimental technique has been demonstrated in
primate to record a
large cortical area over many weeks while simultaneously offering the
spatiotemporal resolution to resolve single neurons and their responses
within individual fixations. Due to the tradeoffs in spatial and
temporal resolution across different experimental techniques, it is
necessary to consider several different sources of experimental data
together.
This need to combine results across experimental techniques is driven by
the incredible biological complexity that underpins cortical
activity. At each moment, the neural response is determined by the
collective interaction of a large interconnected population of
individual cells that are each shaped by their surrounding environment
and long-term history of synaptic inputs.
The experimental data across spatial and temporal scales will be
collected together in two main sections. First the evoked response will
be considered across spatial scales in adult macaque monkey, offering an
insight into how V1 responds at the end of the developmental process. In
the second section, cortical development is considered using the scarce
data obtained from chronic studies.
The experimental difficulty of recording chronically from single cells
is discussed, before the available developmental data is presented in the
form of chronic orientation map measurements using optical
imaging. Finally, existing self-organizing models of orientation map
models are described, including the details of the GCAL model that forms
the basis of the model presented in Chapter \ref{chapter:TCAL}.
\section{Computational modeling approaches}
The process of scientific research is based on the twin pillars of
theory and experiment. Neuroscience is no exception, and both
experimental and theoretical neuroscientists work together towards an
improved understanding of the nervous system, driven and validated by
experiment.
A computational model represents a concrete implementation of a theory
that may be used to integrate information across different
experiments, make novel predictions and bridge the gap between
theoretical concepts and empirical data. There are many different types
of computational model and this section will briefly describe some of
them, in order to place the work presented in this thesis in a broader
context.
The following categorization of approaches is relevant both for
neural map models \citep{bednar_fnc16} and more widely
across computational neuroscience. These definitions constitute a
partial and not mutually exclusive list of the different modeling
paradigms. In other words, any particular model may have components that
partially satisfy any of the following criteria in varying degrees:
%% Ideally, computational models will be designed to answer
%% specific questions that arise from either existing
%% experiments or theoretical considerations.
\begin{description}
%% use '\hfill \\' to break lines
\item[Phenomenological] These models designed to describe or reproduce
experimentally observed behavior without necessarily any reference to the underlying
mechanisms in the biological system. These models are also sometimes
called ``descriptive'' models, as they describe a phenomenon without
addressing its physical basis. The ``invariant response
descriptive model'' described in section \ref{section:IRD_background}
and used in Chapter \ref{chapter:SIRD}
is one example of such a model.
\item[Normative] These models are aimed at explaining some functional
criterion that is believed to be essential for the operation of a
biological system. Normative models do not need to be derived with
reference to the structure of neural elements or circuits and are
therefore distinct from mechanistic models.
\item[Mechanistic] These models explicitly claim an
isomorphism between elements of the model and the structure of
nervous system. A good mechanistic model must also be a good
phenomenological model, i.e., matching behavior as well as just
mechanisms.
% jbednar: broke this out from mechanistic, because there are
% non-mechanistic developmental models, such as the elastic net. The
% elastic net makes no claim of isomorphism of mechanisms, yet fits
% the criteria for a developmental model (or at least the authors
% present it as such, i.e., as an explanation for where the
% structure comes from).
\item[Developmental] Developmental models aim to explain how
adult-like circuitry or mechanisms emerge from some initial
conditions that are simpler or less well ordered. Most
developmental models are also mechanistic, claiming an isomorphism
between the initial stage and early stages in the organism's life
cycle, but some are much more abstract.
\end{description}
The aim of this thesis is to build a mechanistic, developmental model
of evoked neural activity in V1.
In general, all models have some phenomenological or descriptive
component, as every model has to begin with some set of initial
assumptions regarding natural behavior. For instance, a detailed
compartmental model of a neuron needs to assume the existence of ions with certain
behaviors that are not derived from some deeper theory of reality such
as quantum mechanics, but are simply assumed. The firing-rate models
considered in Chapters \ref{chapter:GCAL} and \ref{chapter:TCAL}
assume that some important aspect of the behavior of neurons can be
summarized by its firing rate.
Normative models are often based on abstract criteria regarding
optimality, typically involving the minimization or maximization of
some objective function. One famous example is the idea that receptive
field formation is determined by learning under a sparsity constraint
while attempting to minimize the image reconstruction error
\citep{olshausen_nature96}. Normative models do not need to be
mechanistic and mechanistic models are not necessarily normative, but a
complete explanation would ideally include both if the behavior is of
value to the organism. For this thesis, we will focus on
developmental, mechanistic models to try to connect behavior across a
wide range of time scales, but we will come back to the issue
of normative models for these phenomena in the final discussion.
\subsection{Mechanistic modeling}
A model may be described as mechanistic if the structure of the model
mirrors the relation of physical entities in the biological system. For
computational models of the cortex, mechanistic models thus typically
focus on neurons and their connectivity in a network. One common approach is to
model such a network as a population of interconnected spiking elements,
where individual action potentials are simulated.
There are many different spiking model types, ranging from detailed
conductance-based approaches such as multi-compartment models, to
approaches that greatly simplify the biophysics of action potential generation
such as integrate-and-fire networks. For a review of the simulation
strategies and algorithms used in spiking network model simulations, see
\citet{romain_jcn07}.
In general, the greater the detail of a spiking network model, the
greater the demand on computational resources and the greater the
requirement for experimental data to suitably constrain the biophysics
of all the model components. These technical challenges make it
impractical to simulate the detailed spiking response of cortical tissue on a spatial
scale of millimeters over long periods of simulation time such as hours,
days, and weeks. For this reason, spiking models are not a suitable
platform for examining the timescales that will be considered later on
in this thesis.
Another mechanistic approach is to approximate the behavior of neurons
directly at the level of their firing rates, further simplifying the
biophysics of the model elements. Network firing-rate models typically
use individual units to represent small collections of neurons instead
of individual cells. With more spikes to consider per unit time, this
approach helps improve the validity of representing the spiking
activity as a single floating-point number per model neuron.
Moreover, at least on general-purpose computing hardware with
floating-point processors, simulating a firing-rate network is much
less costly than modeling individual spikes at the level of individual
cells. Moreover, many of the experimental analyses in wide use, even
those for measuring very precise temporal phenomenal such as PSTHs
(peri-stimulus time histograms), effectively use a firing-rate level
of description. Together these properties make firing-rate approaches
particularly suitable for building mechanistic developmental models,
which we will consider in the next section.
\subsection{Developmental modeling}
\label{section:developmental_modeling}
Unlike many mechanistic models that simulate the neural activity on the scale
of milliseconds up to seconds, developmental models typically simulate the
structural changes to the nervous system that occur on the timescale of
hours, days, and weeks. This is because developmental models aim to explain how
adult-like circuitry arises in an organism from an earlier stage of
maturation. The initial condition of the developmental models we will be
considering is not concerned with the initial emergence of neural cells in
the cortex, but will focus on how their connectivity later changes as the
organism matures.
In order to make simulations feasible, mechanistic developmental models
have simplified cellular biophysics and often simulate neural activities
in terms of firing rate. What is lost in biophysical detail is
compensated for by the different types of phenomena and new scientific
questions that developmental models are able to address.
In cortical modeling, developmental models can be used to investigate
the remarkable plasticity and functional flexibility of the
neocortex. One striking illustration is provided by a set of experiments
that induced visual projections into the auditory cortex of ferret,
resulting in the development with visual receptive fields similar to
those of complex cells of primary visual cortex in auditory cells
\citep{sur_science88,roe_jn92}. In humans, there is similar evidence for
cross-modal compensation effects, such as evidence for altered visual
processing in the congenitally deaf \citep{karns_jn12}.
Similar effects have been demonstrated in developmental models, where
the same model results in different learned features, patterns, or
behavior according to the training statistics
\citep{bednar_jpp12,miikkulainen_2005}. For instance, it has been shown
that simulated orientation maps acquire similar biases when trained
with skewed orientation statistics, as experimentally observed in
goggle-rearing experiments \citep{stevens_jn13,tanaka_plosone09}.
These examples are compelling demonstrations that the structural and
functional properties of cortex are plastic and are emergent properties
of the developmental process. In turn, developmental models are the only
way to explore how the structure of the nervous system depends on the
statistical structure of the environment, which has important
philosophical implications.
Firstly, this dependence suggests a way to link mechanistic and normative models. A
mechanistic, developmental model with plasticity can potentially show
how a concrete, biologically plausible mechanism implements a normative
criterion, such as the expression of receptive field structure in terms
of natural image statistics \citep{hyvrinen_book09}.
Secondly, a developmental model can explain the causal link between
neural structure and the sensory input that has been received from the
external world via plasticity. This link is what makes a cortical area such
as the primary visual cortex be about vision and the receptive fields in
ferret auditory cortex also be about vision after suitable experimental
manipulation. This issue regarding what neural processing is
\emph{about} is closely related to the philosophical question known as
``symbol grounding''.
The philosophical debate around the symbol grounding problem originated
with John Searle's ``Chinese Room argument'' \citep{searle_bbs80}. This
thought experiment claims to demonstrate that a traditional computer
program cannot generate its own semantics, whereas natural systems, such
as the human brain, can. Framed in another way, the issue is to
understand how the components of a computation can meaningfully refer to the
appropriate entity in the external world.
In a non-developmental, mechanistic model where synaptic structure has
not been shaped by visual input, there is a similar problem. That is, how
can the computation performed by such a neuron truly correspond to vision if
the synaptic structure of the computation has at most an accidental
relationship to anything visual, rather than a causal relationship
as in developmental models?
The purpose of this thesis is to show how it is possible to construct a
single model that captures this relationship between visual input and
cortical structure on the timescale of development, and then to relate
this network structure to the evoked response addressed by other types
of mechanistic model on short timescales. These results will establish
a new class of mechanistic model that is able to explore
scientific questions that were outside the scope of all previous
modeling approaches, helping us get closer to a true understanding of
how the brain is constructed to represent its inputs in its evoked responses.
To explain how these models relate to the underlying biological
systems, the following sections will summarize the relevant biological
results.
\section{Anatomical background}
The neocortex is the highly convoluted layer of neural tissue covering
the surfaces of the cerebral hemispheres. The cortical surface is
composed of numerous regions associated with different faculties
including areas involved in primary sensory processing, cognitive and
linguistic performance, and motor output. This remarkable diversity in
function is supported by a laminar organization that remains remarkably
constant across the entire cortex.
The primary visual cortex (V1) is one of the most widely studied
cortical areas due to the relative simplicity of the afferent pathway
and the ease with which visual stimuli can be controlled and
manipulated. In addition, the surface of V1 is readily accessible
once a suitable opening in the skull has been made, enabling a number of
different experimental approaches including electrophysiology and
optical imaging techniques.
This section outlines the anatomical structure of the mammalian
early visual pathway involved in the transmission of information from
the visual environment to the cortical neurons of V1. This summary
covers the background material necessary to understand the various
components of the mechanistic models that will be discussed later on and
puts the experimental data used for calibration in context.
Although there is anatomical variation between different mammalian
species and the specific goal is to account for the cortical response
observed in macaque, this section is general enough to describe the
early visual pathway of any mammal that has smooth, well-organized
orientation maps. This level of generality is
deliberate, as experimental data is not always available for macaque,
especially when considering chronic recordings needed to calibrate the
developmental process. In particular, the chronic orientation map
recordings described in section \ref{section:ferret_map_stability} are
only available for ferret.
Figure \ref{fig:basic_anatomy} shows how the photoreceptors of the
retina of the eyes connect via the retinal ganglion cells (RGCs) to the
lateral geniculate nucleus (LGN) via one-to-one projections which in
turn connect to primary visual cortex via the optic radiations. The
information from the two eyes splits at the optic chiasm so that the
left visual hemifield maps the right hemisphere and vice versa.
\begin{figure}
\center
\includegraphics[width=0.6\textwidth]{./figures/basic_anatomy.pdf}
\caption{{\bf The mammalian early visual pathway.} Anatomy of the visual
pathway from the photoreceptors in the retina through the lateral
geniculate nucleus (LGN) in the thalamus to the primary visual cortex
(V1). On the right, the anatomical structures at each stage of visual
processing are shown. The top right schematic shows the photoreceptors
at the back of the retina where light is transduced into an electrical
signal which passes through the bipolar cells to the ganglion
cells. The axons of the ganglion cells form the optic nerve which
projects to the LGN shown in the middle schematic on the right. The
LGN has a laminar arrangement where each layer aligns input from both
eyes to form a retinotopic map of the contralateral portion of the
visual field. The majority of the axons from LGN neurons then project
via the optic radiations to V1, terminating in layer 4. The
organization of the parvocellular, magnocellular, and koniocellular
pathways is shown in both the LGN and V1 schematics, where the shading
indicates the pattern that emerges when V1 slices are stained for
the metabolic marker cytochrome oxidase. Reproduced from
\citet{solomon_naturerev07}.}
\label{fig:basic_anatomy}
\end{figure}
The classical receptive field of a visually responsive cell corresponds
to the best stimulus pattern found to evoke a response. Figure
\ref{fig:example_RFs}A shows a schematic of the center-surround
receptive-field structure typical of a mammalian LGN ON cell as well as
an example recorded from cat. Part B of the figure shows the
corresponding schematic for a V1 neuron composed of an ON and OFF lobe
as well as a typical example of an oriented receptive field recorded
from simple cell in area 17 (cat). This elongated, Gabor-like receptive
field is also observed in macaque, as can be seen in the simple cell
spatiotemporal RF in Figure \ref{fig:example_RFs}C.
% jbednar: Maybe should use a directionally selective cell in C so that
% the spatiotemporal RF is more interesting?
\begin{figure}
\center
\includegraphics[width=0.9\textwidth]{./figures/example_RFs.pdf}
\caption{{\bf Example receptive fields in the LGN and V1.} (A) Schematic
of a typical LGN center-surround receptive field next to an example
recorded from an LGN ON cell. (B) Schematic of a typical V1 simple cell
receptive field next to an example recorded from a V1 cell. The two
examples are shown are recorded in cat and reproduced from
\citet{deangelis_tin95}. (C) A spatiotemporal receptive field recorded
from a macaque simple cell using subspace reverse correlation. The
inset number shows the time in milliseconds at which the RF is
computed. Reproduced from \citet{dario_jneurophys01}.}
\label{fig:example_RFs}
\end{figure}
The orientation-selective cells in V1 have a spatial
organization across the cortical surface that falls into two classes
when considering mammalian species. Rodents, for instance, have a ``salt
and pepper'' organization where orientations appear randomly distributed
down to the cellular level, as shown in Figure \ref{fig:example_OR_maps}A.
In contrast, carnivorans and primates such as macaque have a smooth orientation map
organization as seen in Figure \ref{fig:example_OR_maps}B and C. As the
model presented in this thesis aims to model the cortical response in
macaque, any orientation maps of the model should have this sort of
smooth organization.
\begin{figure}
\center
\includegraphics[width=0.9\textwidth]{./figures/rat_macaque_maps.pdf}
\caption{{\bf Example orientation maps in rat and macaque V1.} (A)
``Salt and pepper'' arrangement of orientation preference in rat V1 as
recorded with two-photon calcium imaging down to subcellular
resolution. Preferences are indicated by the cyclic color key on the
right. Reproduced from \citet{ohki_nature05}. (B) Orientation preference
map recorded using optical imaging in anesthetized macaque using the
same color key. The distance $\Lambda$ covers a change of $180^\circ$
and corresponds to the hypercolumn distance. The white circles mark
two pinwheel locations around which all preferences are
represented. These two pinwheels have opposite polarities with a
clockwise progression moving up the color key for the left pinwheel
and a clockwise progression down the color key for the pinwheel on the
right. (B) The corresponding orientation selectivity map. Reproduced
from \citet{blasdel_jn92b}.}
\label{fig:example_OR_maps}
\end{figure}
Smooth orientation maps have more identifiable structure than salt and
pepper arrangements. In particular, as the map varies smoothly,
hypercolumns can be identified as a continuous region over which the
full set of receptive-field parameters are covered. In the case of
hypercolumns, this corresponds to the average distance over which the
orientation preference cycles over $180^\circ$. The corresponding
circular feature where a $180^\circ$ change in orientation preference is
observed around a point is called a pinwheel. Pinwheels have two
different polarities depending on whether the orientation preference
increases or decreases when circling the pinwheel center
clockwise. Examples of both these features are shown in Figure
\ref{fig:example_OR_maps}B. The orientation selectivity map is also
smoothly varying as shown in Figure \ref{fig:example_OR_maps}C.
In summary, the visual system is composed of a large population of
neurons with a diversity of receptive field and tuning properties. There
is organization that can be observed at the level of individual neurons
such as the receptive fields of a particular cell shown in Figure
\ref{fig:example_RFs} and there is organization that is only apparent
across a large population of cells, such as the orientation maps shown
in Figure \ref{fig:example_OR_maps}.
From this evidence, it is clear that there are different spatial scales relevant
to the visual response, ranging from single-unit recordings to
measurements of entire feature maps. In the next portion of this
chapter, the ways activity can be recorded across these different scales
will be discussed. This will included a common experimental approach for
measuring activity at the level of an individual neurons and then a
discussion of optical imaging techniques used to record from a large,
spatially extended population of neurons at once.
\section{Dynamics of the evoked response}
\label{section:evoked_background}
The first step toward validating a model of neural response in V1 is to
consider the available experimental data in the fully developed, adult
animal. In this section, the observed experimental responses to
artificial stimuli in adult macaque V1 are discussed, both at the level
of individual neurons and across a spatially extended population.
First the local spiking response will be considered in terms of the
peristimulus time histogram (PSTH) profiles of both simple and complex
cells in macaque. The experimentally observed PSTH profiles are
summarized by the invariant response descriptive model developed by
\citet{albrecht_jneurophys02}.
Next the evoked dynamics across a large population of neurons is
considered using voltage-sensitive--dye imaging, also recorded in
macaque. This technique captures the evoked pattern of response over
several square millimeters of the cortical surface with a high temporal
resolution. The key properties of the observed spatiotemporal dynamics
are then summarized as a function of stimulus contrast.
These two experimental techniques yield very different temporal profiles
for the evoked response. Understanding how these two sources of data can
be consistently accounted for within a single model of the evoked
response is the basis of Chapter \ref{chapter:SIRD}.
\subsection{Local spiking responses}
The temporal properties of the spiking response of a neuron can be
recorded using an electrode with a high temporal resolution, then
expressed as a peristimulus time histogram (PSTH). Such recordings
typically have a high enough temporal resolution to resolve individual
action potentials in a localized volume of neural tissue. One way to
begin quantifying the dynamics of the response of individual neurons in
the visual system is to examine the properties of PSTH profiles evoked
by an appropriate test stimulus. In this section, the PSTH profiles of
both LGN and V1 neurons will be presented.
\subsubsection*{Spiking profiles in the LGN}
The mechanistic models we will consider later on simulate the
propagation of activity from the photoreceptors in the retina to V1 via
the LGN. Therefore, in order to understand what drives the spiking
responses in V1 mechanistically, it is first useful to examine the
spiking response profiles in the LGN.
Figure \ref{fig:LGN_PSTH_maunsell} shows average PSTH profiles for
magnocellular and parvocellular neurons in macaque LGN. Both types of
cell have a peak in spiking activity although the ratio of the peak to
the sustained response is lower in magnocellular neurons. These PSTHS
have been plotted on a $150$ millisecond axis to allow easy comparison
with the V1 PSTH profiles described in the next section.
\begin{figure}
\center
\includegraphics[width=0.9\textwidth]{./figures/LGN_PSTH_maunsell.pdf}
\caption{{\bf Average PSTH profiles for magnocellular and parvocellular
LGN neurons in anesthetized macaque.} Cells were stimulated by
$0.25^\circ$ radius spots that were either brighter (ON) or darker
(OFF) than the background by $28$ \si{cd/mm^{2}}. On the left, the
average PSTH profile for 78 magnocellular neurons is shown. On the
right, the average PSTH for 80 parvocellular neurons. Data reproduced
from \citet{maunsell_visneuro99}.}
\label{fig:LGN_PSTH_maunsell}
\end{figure}
\subsubsection*{The invariant response descriptive model}
\label{section:IRD_background}
The invariant response descriptive (IRD) model of
\citet{albrecht_jneurophys02} offers a mathematical description of the
experimentally observed spiking response of V1 cells. This
phenomenological model summarizes the observed PSTH profiles as a
function of stimulus contrast for simple and complex cells of adult cat
and monkey. For a population of 50 cells, this model was found to
account for approximately 94\% of the variance observed across the
microelectrode recordings and will serve as a way to quantify the
properties of ``typical'' PSTH profiles.
The temporal spiking response profiles of cortical neurons vary in both
shape and amplitude according to the particular cell that is being
recorded, as well as the shape of the driving stimulus. It is nonetheless
useful to try to capture the general properties of observed PSTH
profiles with a simple descriptive model.
The invariant response descriptive (IRD) model is a phenomenological model
that captures the shape of a typical PSTH profiles over 200 milliseconds
in response to the presentation of a stationary sinusoidal grating
pattern at a fixed contrast. First, the profile shape is approximated in
a piecewise manner using a Gaussian function up to the peak value at
$\tau_c$ and a ``$\frac{1}{2}$ Gaussian'' profile to capture the
sustained response thereafter:
%%
\begin{equation}
\label{eq:IRD_half_gaussians}
r_t(t) =
\begin{cases}
\exp \left( -\ln 2 \frac{(t - \tau_c(c))^2)}{\sigma^2_a} \right) & t < \tau_c \\
\exp \left( -\ln 2 \frac{(t - \tau_c(c))^2)}{\sigma^2_b} \right) + (1 - \alpha) \exp \left( -\ln 2 \frac{(t - \tau_b(c))^2)}{\sigma^2_c} \right) & t\geq \tau_c
\end{cases}
\end{equation}
%%