-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathhm.tex
6838 lines (5928 loc) · 418 KB
/
hm.tex
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
\documentclass[english,fontsize=11pt,paper=b5]{scrbook}
\usepackage{iftex}
\ifPDFTeX
\usepackage{fourier} % pdflatex or dvi latex
\usepackage[T1]{fontenc}
\usepackage[utf8]{inputenc}
\else
\usepackage{fontspec} % XeLaTeX or LuaLaTeX
\setmainfont[Renderer=Basic, Numbers=OldStyle, Scale = 1.0]{TeX Gyre Pagella}
\setsansfont[Renderer=Basic, Scale=0.90]{TeX Gyre Heros}
\setmonofont[Renderer=Basic]{TeX Gyre Cursor}
\fi
\usepackage[
HomeHTMLFilename=index, % Filename of the homepage.
HTMLFilename={chapter-}, % Filename prefix of other pages.
% IndexLanguage=english, % Language for xindy index, glossary.
mathjax, % Use MathJax to display math.
makeindex
]{lwarp}
\setcounter{FileDepth}{0}
\boolfalse{FileSectionNames} % Number the file names
\booltrue{CombineHigherDepths} % Combine parts/chapters/sections
\HTMLLanguage{en-UK}
\HTMLDescription{Lecture notes for Hamiltonian Mechanics}
\usepackage{makeidx}
\usepackage{babel}
\usepackage{hyperref}
\hypersetup{
colorlinks,
linkcolor={blue!60!black},
citecolor={blue!60!black},
urlcolor={blue!60!black},
linktoc=page,
hypertexnames=false}
\usepackage{booktabs}
\usepackage{xcolor}
\usepackage{graphicx}
\usepackage{amsmath, amssymb, amsthm}
\numberwithin{equation}{chapter}
\usepackage{physics} % documentation at https://mirror.koddos.net/CTAN/macros/latex/contrib/physics/physics.pdf
\usepackage{units}
\usepackage{tikz}
\tikzset{every picture/.style={ampersand replacement=\&}}
\usepackage{pgfplots}
\usepackage{tikz-3dplot}
\pgfplotsset{compat=1.16}
\input{insbox.tex}
\usepackage{tcolorbox}
% uncomment once no todo is left
\usepackage{todonotes}
% comment before publication
%\usepackage{showlabels}
\PassOptionsToPackage{ type={CC}, modifier={by-nc-sa}, version={4.0}, }{doclicense}
\usepackage{doclicense}
\DeclareTextCommandDefault{\textbullet}{\ensuremath{\bullet}}
\usepackage[backend=bibtex, style=alphabetic, natbib=true, sortcites=false, noerroretextools]{biblatex}
\addbibresource{hm.bib}
% workaround needed for autonum
\let\etoolboxforlistloop\forlistloop
\usepackage{autonum}
\let\forlistloop\etoolboxforlistloop
\begin{warpprint}
\usepackage{picins}
%\usepackage[numbers, sort]{natbib}
%\setlength{\bibsep}{3pt}
%\renewcommand{\bibfont}{\small}
\usepackage{doi}
%\bibliographystyle{plainnat}
\end{warpprint}
\begin{warpHTML}
\newcommand{\doi}[1]{\href{https://doi.org/#1}{#1}}
%\bibliographystyle{alpha}
\end{warpHTML}
\DeclareMathOperator{\D}{D}
\DeclareMathOperator{\Id}{Id}
\DeclareMathOperator{\diag}{diag}
\let\mod\relax
\DeclareMathOperator{\mod}{mod}
\DeclareMathOperator{\Vol}{Vol}
\begin{warpMathJax}
\CustomizeMathJax{
%\newcommand{\vb*}{\boldsymbol}
\DeclareMathOperator{\D}{D}
\DeclareMathOperator{\Id}{Id}
\DeclareMathOperator{\diag}{diag}
\DeclareMathOperator{\mod}{mod}
\DeclareMathOperator{\Vol}{Vol}
}
\end{warpMathJax}
\newtheorem{theorem}{Theorem}[chapter]
\newtheorem{proposition}[theorem]{Proposition}
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{corollary}[theorem]{Corollary}
\newtheorem{definition}{Definition}
\theoremstyle{definition}
\newtheorem{remark}{Remark}[chapter]
\newtheorem{example}{Example}[chapter]
\newtheorem{exercise}{Exercise}[chapter]
\usepackage[toc,page]{appendix}
\usepackage{subfiles}
\title{Hamiltonian Mechanics}
\author{Marcello Seri\\
\small{Bernoulli Institute}\vspace{-.2cm}\\
\small{University of Groningen}\vspace{-.2cm}\\
\small\href{mailto:[email protected]}{m.seri (at) rug.nl}
}
\date{}
\usepackage{scrhack}
\newcommand{\emphidx}[1]{\index{#1}\emph{#1}}
\makeindex
\begin{document}
\maketitle
\cleardoublepage
\thispagestyle{empty}
\null\vfill
\begin{center}
Version 1.20 $\alpha$2\\
\today
\end{center}
\begin{warpprint}
\vfill
\small{\doclicenseThis}
\end{warpprint}
\cleardoublepage
\pagenumbering{roman}
\tableofcontents
\cleardoublepage
\pagenumbering{arabic}
\chapter*{Preface}
\todo{Rewrite}
The literature on classical (or analytical, as it was called by Lagrange) mechanics is full of good material.
Different sources present the topic from different perspectives and with different points of view, and may suite different people differently.
In these lecture notes I am iterating on my perspective.
The approach I am taking has been heavily influenced by \cite{book:arnold, book:knauf, lectures:dubrovin, book:lowenstein, book:marsdenratiu, lectures:tong, landau1976mechanics}.
The book \cite{book:knauf} will be a good extra reference for the course. In addition to being a good introduction to many topics in classical mechanics that we will not have time to discuss during the lectures, it covers almost all the material that we will treat in chapters 1, 6, 8, 10, 11, 13, 15. Furthermore, the book can be freely and legally accessed via the University proxy using the \href{https://link.springer.com/book/10.1007%2F978-3-662-55774-7}{SpringerLink} service.
I had lots of fun reading \cite{schwichtenberg2019no}, if none of the references above satisfies you, consider having a look at that. And for an unusual approach to the topic, centered around the idea that everything should be explicit enough to be directly computable by a computer, you can have a look at the marvellous \cite{book:sicm}. Finally, a good and enjoyable classical reference is \cite{goldstein2013classical}.\medskip
These notes are not (yet?) exhaustive.
They will be updated throughout the course, and it will likely take a few years of course iterations before they fully stabilize.
Some topics, examples and exercises discussed in class will not be in these notes, but may appear as examples, exercises or problems in the literature presented above or on the material posted in the course webpage.
Throughout the course, we will discuss the main ideas in Newtonian, Lagrangian and Hamiltonian mechanics and the relations between them.
This will include symmetries and elementary phase space reduction, normal modes and small oscillations.
We will then move to study action--angle coordinates and integrability, and finally we will discuss elementary perturbation theory.
On the latter, we will only briefly discuss resonances and mostly focus on the meaning of the Kolmogorov-Arnold-Moser theorem and the Nekhoroshev theorem.
Topics that I intend to add over time include: contact mechanics, non-holonomic mechanics, sub-riemannian geometry, numerical methods, rigid bodies, mathematical billiards, integrability via Lax pairs... I don't know if this is just whishful thinking or if it will happen at some point, but I welcome any contribution in these directions.
A number of extra references covering some of the topics mentioned above is \href{https://www.mseri.me/links-from-hm/}{collected on my blog}. I will make sure to keep the post updated and the links working. \medskip
Please don't be afraid to send me comments to improve the course or the text and to fix the many typos that will surely be in this first draft. They will be very appreciated.
I am extremely grateful to Nithesh Balasubramanian, Senan Bird, Riccardo Bonetto, Jose\-phine van Driel, Ramsay Duff, Brian Elsinga, Mollie Jagoe-Brown, Jesse Mulder, Ruxandra Nastase, Dijs de Neeling, Anouk Pelzer, Iisekki Rotko, Danique de Ruiter, Robbert Scholtens, Felix Semler, Albert \v{S}ilvans, Marit van Straaten and Jermain Wall\'e for their careful reading of the notes and their useful comments and corrections.
Last but not least, I owe a huge debt of gratitude to \href{https://crojasmolina.com}{Constanza Rojas-Molina}, who kindly allowed me to use some of her beautiful artworks in these notes.
\chapter{Classical mechanics}
In this chapter we will review some basic concepts of classical mechanics.
In particular we will briefly discuss variational calculus, Lagrangian mechanics and Newtonian mechanics, superficially presenting along the way some simple examples to motivate part of the rest of the course.
For a deeper and more detailed account, you can refer to \cite{book:arnold,book:knauf}.
\section{Newtonian mechanics of point particles}
In the elementary formulation we will focus on, our primary interest is in describing the equations of motion for an idealized \emphidx{point particle}.
This is a point--like object obtained by ignoring the dimensions of the physical object.
Note that in many cases this is a reasonable first approximation.
For example, when describing planetary motion around the sun, we can consider the planet and the sun as two point particles without significantly affecting the qualitative properties of the system.
After all the sun is about 150 million kilometers away from the Earth, compared to which their sizes are negligible.
The diameter of the sun is just 0.9\% of this distance and the diameter of the Earth a mere 0,008\%. See Figure~\ref{fig:sun-earth-scale}.
\begin{figure}
\centering
\includegraphics[width=.9\linewidth]{images/sun-earth-scale.pdf}
\caption{The sun and the Earth to scale. Everything is in the correct scale, there is a --practically invisible-- blue dot at the end of the line}\label{fig:sun-earth-scale}%
\end{figure}
Of course this is not a universal simplification, even for celestial systems: for instance, we cannot do it when describing the motion of a planet around its axes.
In this case, the shape and the internal structure of the body becomes to relevant to ignore.
A point particle is first of all a point, a dimensionless mathematical object in space: its \emphidx{position} in space is described by the position vector $\vb*{x} = (x, y ,z)$.
Keep in mind that
\begin{equation}
\vb*{x} : \mathbb{R}\to\mathbb{R}^3,\quad t \mapsto \vb*{x}(t),
\end{equation}
is a function of time that describes the instantaneous state of the system during its evolution.
In most cases, this will be implicitly assumed and we will omit the explicit dependence on $t$.
The \emphidx{velocity} of the point particle is given by the rate of change of the position vector,
i.e., its derivative with respect to time\footnote{Notation: the symbol $a := b$ means that $a$ is defined by the expression $b$. Similarly $b =: a$ is the same statement but read from right to left.}
\begin{equation}
\vb*{v} = \dv{\vb*{x}}{t} =: \dot{\vb*{x}} = (\dot{x}, \dot{y}, \dot{z}).
\end{equation}
%
We call \emphidx{acceleration}, the rate of change of the velocity, i.e., the second derivative
\begin{equation}
\vb*{a} = \dv[2]{\vb*{x}}{t} =: \ddot{\vb*{x}} = (\ddot{x}, \ddot{y}, \ddot{z}).
\end{equation}
For us, the main distinction between a mathematical point and a point particle, is that the latter usually carries a \emph{mass} $m$.
This is a scalar quantity that, as we will see, measures its resistance to changes in its state of motion, also known as \emphidx{inertia}.
\begin{tcolorbox}[title=Newton's second law of motion]
\index{Newton!second law}
There exist \emphidx{frames of reference}, that is, systems of coordinates, in which the motion of the particle is described by a differential equation involving the forces $\vb*{F}$ acting on the point particle, its mass $m$ and its acceleration as follows
\begin{equation}\label{eq:newton}
\vb* F = m \ddot{\vb*{x}}.
\end{equation}
\end{tcolorbox}
Note that the law as described above is not completely true: Newton was already talking about momentum, which \href{https://web.archive.org/web/20211201082909/https://bigthink.com/starts-with-a-bang/most-important-equation-physics/}{makes a deep difference}, but would set us off-course right now. \medskip
Before moving on, let's anticipate three examples that will come back over and over in the course of this book.
Here we will just sketch them, but we will come back to them in more detail later.
\begin{example}[Horizontal spring and pendulum]\label{ex:sprPen}
\index{spring}\index{pendulum}
Consider an ideal spring, that is, an idealized system consisting of a point particle of mass $m$ attached to a spring with stiffness $k$, sliding on a frictionless surface.
Assume that the motion is one-dimensional, along the axis of the spring, and let $x$ denote the displacement of the system from its equilibrium position, i.e., the position in which the spring is completely at rest: not compressed nor extended.
It is convenient to assume that the sliding happens on a flat surface.
This allows us to exclude gravitational forces from the picture, making this example as simple as it could be.
\begin{figure}[ht!]
\centering
\includegraphics[width=\linewidth]{images/HM-1-2.pdf}
\caption{Left: horizontal spring. Right: planar pendulum.}%
\label{fig:spring-pendulum}
\end{figure}
\emph{Hooke's law} \index{spring!Hooke's law} states that the restoring force $F$ exerted by an ideal spring is directly proportional to its displacement $x$ from equilibrium.
The law is expressed mathematically as $F(x) = -kx$, where $k$ is the spring constant\index{spring!constant}, a measure of the spring's stiffness.
The negative sign indicates that the force acts in the opposite direction of the displacement, always seeking to restore the spring to its equilibrium position. See Figure~\ref{fig:spring-pendulum}, left panel.
According to \eqref{eq:newton}, then, the motion of the point particle is given by
\begin{equation}\label{eq:spring}
m \ddot{x} = - k x \qquad\mbox{or}\qquad \ddot{x} = - \omega^2 x \quad\mbox{where } \omega = \sqrt{k/m}.
\end{equation}
The solution, $x(t)$, is generally described by
\begin{equation}\label{eq:springsol}
x(t) = R \cos(\omega t + \phi),
\end{equation} with the unknowns $R\in\mathbb{R}$ and $\phi\in[0,2\pi)$ uniquely prescribed by the initial conditions
\begin{equation}
x(0) = R\cos(\phi) \qquad\mbox{and}\qquad \dot x(0) = -\omega R \sin(\phi).
\end{equation}
Once we know the initial conditions, the full evolution of the solution $x(t)$ is known.
\medskip
Consider, now, an ideal pendulum \index{pendulum!ideal}. That is, a point particle of mass $m$ attached to a pivot on the ceiling via a rigid rod of length $l$.
Assume the motion is frictionless and happening only in a vertical plane.
Let $x$ denote the angle of displacement of the system from its equilibrium position on this plane, i.e., the lowest point on the arc of motion.
Without loss of generality, we can assume the angle at equilibrium to be zero, with positive sign on the right hand side of the vertical, and negative on the left. See Figure~\ref{fig:spring-pendulum}, right panel.
The force acting on the pendulum is Earth's gravitational attraction.
According to \eqref{eq:newton}, then, the motion of the point particle is given by
\begin{equation}
m l \ddot{x} = - m g \sin(x) \qquad\mbox{or}\qquad \ddot{x} = - \omega^2 \sin(x) \quad\mbox{where } \omega = \sqrt{g/l}.
\end{equation}
Here, $g \approx 9.8 m s^{-2}$ denotes the gravitational acceleration.
Although it is possible to solve the equation of motion of the pendulum explicitl yby means of \emphidx{elliptic integrals}~\cite{elliptic}, this is rather cumbersome.
In some cases, when $\sin x \approx x$, we can simplify our life and, instead, use the equation of the spring as a model for the pendulum oscillation via the so-called \emph{small oscillations} approximation.
We will come back to this later on.
\end{example}
\begin{example}[Idealized motion of the Earth around the Sun]\label{ex:Kepler0}
Let us approximate the Sun with a point particle of mass $M$ positioned at the origin $\vb*{0}\in\mathbb{R}^3$ of the Euclidean space.
In this model of the solar system, with the Sun fixed at the origin, we will describe the Earth by a point particle of mass $m$ whose position (and motion) is described by a vector $\vb*{x}\in\mathbb{R}^3$.
Due to our choice of coordinates, the gravitational attraction of the Sun acts in the direction of $-\vb*{x}(t)$.
\emph{Newton's law of universal gravitation} \index{Newton!universal gravitation} says that such a force is proportional to
\begin{equation}
\frac{GmM}{\|\vb*{0}-\vb*{x}\|^2} = \frac{GmM}{\|\vb*{x}\|^2},
\end{equation}
where $G \sim 6.674 \cdot 10^{-11} \frac{m^3}{s^2\,kg}$ is called the \emphidx{gravitational constant}.
Newton's second law \eqref{eq:newton}, then, leads to the equation of motion
\begin{equation}\label{eq:keplerex}
m \ddot{\vb*{x}} = - \frac{GmM}{\|\vb*{x}\|^2} \frac{\vb*{x}}{\|\vb*{x}\|}.
\end{equation}
This is an autonomous second order ordinary differential equation on the configuration space $\mathbb{R}^3\setminus\big\{\vb*{0}\big\}$.
Providing the initial conditions $\vb*{x}(0)=\vb*{x}_0$ and $\dot{\vb*{x}}(0)=\vb*{v}_0$, we can try to solve \eqref{eq:keplerex}, and you are welcome to try.
As it is often the case, though, things can become easier by taking a step back and looking at the problem differently.\medskip
Behind differential equations in classical mechanics lies a surprisingly rich geometrical structure, in which symmetries and conserved quantities play a special role.
These can help to obtain extensive information on the solution of classical equations of motion without the need to explicitly solve the equations (which, in general, is impossible).
Let's have an initial brief look at this in the context of the Kepler problem.
Consider the space $\big(\mathbb{R}^3\setminus\big\{\vb*{0}\big\}\big)\times\mathbb{R}^3$, and define there, for the moment without further justification or explanation, the total energy function
\begin{equation}\label{eq:energyKepler}
E(\vb*{x},\vb*{v}) = \frac{1}{2}m\|\vb*{v}\|^2 - \frac{GmM}{\|\vb*{x}\|},
\end{equation}
the angular momentum
\begin{equation}
L(\vb*{x},\vb*{v}) = m \vb*{v} \times \vb*{x},
\end{equation}
and the Laplace-Runge-Lenz vector
\begin{equation}
A(\vb*{x},\vb*{v}) = m \vb*{v} \times L(\vb*{x}, \vb*{v}) + \frac{G m^2 M^2}{m+M} \frac{\vb*{x}}{\|\vb*{x}\|}.
\end{equation}
Along the solutions $\vb*{x}(t)$ of \eqref{eq:keplerex}, let us define $E(t) := E(\vb*{x}(t),\dot{\vb*{x}}(t))$ and, similarly, $L(t)$ and $A(t)$.
In due time we will show that, $L(t) = L(0) \neq 0$ for all times, and also $E(t) = E(0)$ and $A(t) = A(0)$ are constant for all times.
Furthermore, any solution that lives on the subspace defined by
\begin{align}
\big\{
(\vb*{x}, \vb*{v})\in \big(\mathbb{R}^3\setminus\big\{\vb*{0}\big\}\big)\times\mathbb{R}^3 \;\mid\;
E(\vb*{x},\vb*{v}) = E(\vb*{x}_0, \vb*{v}_0),\;
L(\vb*{x},\vb*{v}) = L(\vb*{x}_0, \vb*{v}_0),\;
A(\vb*{x},\vb*{v}) = A(\vb*{x}_0, \vb*{v}_0)
\big\},
\end{align}
must be a conic of the following type
\begin{equation}
\begin{split}
\mbox{ellipse} \quad \mbox{if} \quad E(t) = E(0) < 0, \\
\mbox{parabola} \quad \mbox{if} \quad E(t) = E(0) = 0, \\
\mbox{hyperbola} \quad \mbox{if} \quad E(t) = E(0) > 0.
\end{split}
\end{equation}
This is an example of a central force field, and is one of the most prominent and most important examples in this course.
The impatient reader can find in \cite[Ch. 1]{book:knauf} a nice and compact derivation of Kepler's laws and the invariants above from \eqref{eq:keplerex}.
\end{example}
\subsection{From particles to systems of particles}
It is a bit limiting to consider only systems with one particle and, indeed, many interesting problems in classical mechanics involve systems on interacting particles.
In general a system of $N$ point particles \index{point particle!system} will be described by a set of $N$ position vectors $\vb*{x}_k = (x_k, y_k ,z_k)$ with masses $m_k$, $k = 1, \ldots, N$.
For convenience we will denote $\vb*{x} = (\vb*{x}_1, \ldots, \vb*{x}_N)\in\mathbb{R}^{3N}$, and $\vb*{m} = (m_1, \ldots, m_N)\in\mathbb{R}^N$.
We call $\vb*{x}(t)$ the \emphidx{configuration} of the system at time $t$ in the \emph{configuration space} \index{configuration!space} $\mathbb{R}^{3N}$.
Note that we are identifying $\mathbb{R}^{3\times N}$, the space of $3\times N$ matrices, and $\mathbb{R}^{3N}$, the space of $3N$ vectors. Namely, $\vb*{x} = (\vb*{x}_1, \ldots, \vb*{x}_N) = (x_1, y_1, z_1, x_2, y_2, z_2, \ldots, x_N, y_N, z_N)$ is used interchangeably as the vector of positions of the points in three-space or as the vector including all the positions of the $N$ bodies together.
\begin{example}\label{example:gcoords}
A system of two ideal pendulums is described by two position vectors, so $\vb*{x} = (\vb*{x}_1, \vb*{x}_2)\in\mathbb{R}^{6}$.
Notice, however, that to describe their configuration we only need \emph{two angular variables}, one for each of the pendulums.
So, for all practical purposes, the system could be completely described by $q = (q^1, q^2) \in \mathbb{S}^1\times\mathbb{S}^1 \simeq \mathbb{T}^2$. See Figure~\ref{fig:twopend}.
\begin{figure}[ht!]
\centering
\includegraphics[width=0.9\linewidth,trim={0 1cm 0 1cm}, clip]{images/HM-1-1.pdf}
\caption{Left: a system of two decoupled pendulums in $\mathbb{R}^3$. Right: corresponding generalized coordinates.}%
\label{fig:twopend}
\end{figure}
The symbol $\simeq$ usually denotes some kind of equivalence, but which specific kind is context-dependent and not often well explicited.
So, let us take this opportunity to clarify the notation.
What we wrote above, $\mathbb{S}^1\times\mathbb{S}^1 \simeq \mathbb{T}^2$, should be read as: the 2-torus, i.e., the surface of a doughnut, is \emphidx{diffemorphic} to the product of two circles. Here, diffeomorphic is a concept from the theory of smooth manifolds, and stands for the existence a smooth bijection between the two constructions.
If we then think of a circle $\mathbb{S}^1$ as the interval $[0, 2\pi)$ with the endpoints identified, the observation above is saying that the torus $\mathbb{T}^2$ can be thought of as the square $[0, 2\pi)\times[0, 2\pi)$ with the edges identified in the usual way and $q = (q^1, q^2) \in [0, 2\pi)\times[0, 2\pi) \subseteq \mathbb{R}^2$.
Such a long story to say that, while in principle this system is 6-dimensional, for all practical purposes it is 2-dimensional.
\end{example}
As exemplified by the example above, we want to set up a formalism that allows us to describe the configuration of a system in a way that is independent of the number of particles and instead captures the minimal number of parameters that are really necessary to describe it.
We say that a system of $N$ particles has \emph{$n$ degrees of freedom} \index{degrees of freedom} if we need $n$ independent parameters to uniquely specify the system configuration.
We call \emph{generalized coordinates} \index{generalized!coordinates}any set of $n$ parameters $q = (q^1, \ldots, q^n)$ that uniquely determine the configuration of a system with $n$ degrees of freedom, and \emph{generalized velocities} \index{generalized!velocities} their time derivatives $\dot q = (\dot q^1, \ldots, \dot q^n)$.
The \emph{state} \index{state space} of the system is then characterized by the set of (generalized) coordinates and velocities $(q, \dot q) = \left(q^1, \ldots, q^n,\dot q^1, \ldots, \dot q^n\right)$.
As Example~\ref{example:gcoords} shows, the $n$ degrees of freedom do not have to be the cartesian coordinates of the point particles.
If you recall differential geometry, you may (correctly) guess that the generalized coordinates will be points on some differentiable manifold $q\in M$, their evolution will be described by a curve $q: \mathbb{R} \to M$ parametrized by time and the state of the system will be a point in the tangent bundle $(q, \dot q)\in TM$, i.e., $\dot q \in T_q M$. If you don't have any previous experience with these concepts, don't dispare! We will take our time to introduce them as they appear throughout the course. See also section~\ref{sec:lagrangianonmanifold}).
\medskip
We have now all the elements to translate the \emph{Newton's principle of determinacy} \index{Newton!principle of determinacy} in mathematical terms.
In 1814, Laplace \cite{book:laplace} wrote
\begin{quotation}
We may regard the present state of the universe as the effect of its past and the cause of its future. An intellect which at a certain moment would know all forces that set nature in motion, and all positions of all items of which nature is composed, if this intellect were also vast enough to submit these data to analysis, it would embrace in a single formula the movements of the greatest bodies of the universe and those of the tiniest atom; for such an intellect nothing would be uncertain and the future just like the past would be present before its eyes.
\end{quotation}
In other words, this principle states the following.
\begin{tcolorbox}[title=Newton's principle of determinacy]
The initial state $\left(q(t_0), \dot q(t_0)\right) \in \mathbb{R}^n$ of a physical system with $n$ degrees of freedom, uniquely determines its evolution $\left(q(t),\dot q(t)\right)$ for all $t > t_0$.
\end{tcolorbox}
We had already observed this fact in Example~\ref{ex:sprPen} of the pendulum, where the initial position and velocity uniquely determined the whole trajectory.
Picard-Lindel\"of theorem, also known as ``Existence and uniqueness of solutions of initial value problems'' \cite[Theorem 3.17]{book:knauf}, implies that Newton's principle of determinacy is locally satisfied by the \emphidx{equations of motion} of most mechanical systems, i.e., second order differential equations derived from Newton's law.
\section{Hamilton's variational principle}\label{sec:varpri}
In order to leave more space to discuss Hamiltonian systems and their geometry, we will be brief in our account of Lagrangian mechanics and calculus of variations, although not as brief as this \href{https://web.archive.org/web/20220404153248/https://twitter.com/j\_bertolotti/status/1397159397596581889}{twitter thread}.
Our quick treatment shouldn't mislead you, though. Lagrangian mechanics is just as crucial as Hamiltonian mechanics in the grand scheme of classical physics.
In fact, many would argue that the most general formulation of motion equations in classical mechanics comes from the \emph{principle of least action}, also known as \emph{Hamilton's variational principle}.
This principle, introduced by Hamilton in 1834, suggests that a mechanical system's equations of motion are characterized by a function
\begin{equation}
L \equiv L(q, v, t) : \mathbb{R}^n \times \mathbb{R}^n \times \mathbb{R} \to \mathbb{R},
\end{equation}
called the \emphidx{lagrangian} (function) of the system.
\begin{example}
The lagrangian of a mechanical system consisting of a point particle with mass $m > 0$ in a potential $U : \mathbb{R}^n \to \mathbb{R}$ is
\begin{equation}
L(q, v, t) = \frac12 m \|v\|^2 - U(q),
\end{equation}
which is the difference between the so-called \emph{kinetic energy} of the particle and its so-called \emph{potential energy} $U$.
We will see where this equation comes from in Section~\ref{sec:dynamicspps}.
\end{example}
Given a curve $\gamma:[t_1, t_2] \to \mathbb{R}^n$, we define the \emphidx{action} functional as
\begin{equation}\label{eq:Laction}
S[\gamma] := \int_{t_1}^{t_2} L(\gamma(s), \dot \gamma(s), s) \dd s.
\end{equation}
\begin{tcolorbox}[title=Principle of least action]
\index{principle of least action}\index{Hamilton's principle}
Consider a system with $n$ degrees of freedom which is in the configuration $q_1 = (q_1^1, \ldots, q_1^n)$ at an initial time $t_1$ and $q_2 = (q_2^1, \ldots, q_2^n)$ at a final time $t_2 > t_1$.
The \emph{principle of least action}, or \emph{Hamilton's principle}, states that the evolution of the system in the time interval $[t_1, t_2]$ corresponds to the curve $q(t)$ which is the \emph{critical point} of the action functional $S[q]$ on the space of curves $\gamma:[t_1, t_2] \to \mathbb{R}^n$ with fixed endpoints $\gamma(t_1) = q_1$ and $\gamma(t_2) = q_2$.
\end{tcolorbox}
To make this precise, we will need to recall some preliminary concepts and make sense of differentiation in $\infty$-dimensional spaces.\medskip
We will present the theory in the general setting of \emphidx{Banach spaces}, that is, complete normed vector spaces. If $X$ is a Banach space, then we will denote the corresponding norm by $\|\cdot\|_X$.
Let $X$ and $Y$ be Banach spaces and $G\subset X$ an open subset of $X$.
A function $f: G \to Y$ is called \emph{Fr\'echet differentiable} \index{Frechet!differentiable} at $x\in G$, if there exists a bounded linear operator $A: X \to Y$, such that
\begin{equation}\label{eq:frechetdiff}
f(x+h) = f(x) + Ah + o(\|h\|_X)
\end{equation}
asymptotically as $\|h\|_X\to 0$, that is, for any $h$ in a sufficiently small neighborhood of $0\in X$.
Here, we write $g = o(\|h\|_X)$ if $g : X \to Y$ satisfies
\begin{equation}
\lim_{\|h\| \to 0} \frac{\|g(h)\|_Y}{\|h\|_X} = 0.
\end{equation}
As in the finite-dimensional case, $A$ is uniquely determined and is called the \emph{Fr\'echet derivative} \index{Frechet!derivative} of $f$ at $x$, which we will denote $D f(x)$.
\begin{remark}
\begin{enumerate}
\item In the finite dimensional setting, Fr\'echet differentiability corresponds to total differentiability.
\item As in the finite dimensional case, Fr\'echet differentiability implies the continuity of the mapping.
\item The analogy with the finite dimensional case goes further. Indeed, the chain rule, mean value theorem, implicit function theorem, inverse mapping theorem and the statements about local extremes with and without constraints, all hold also for Fr\'echet differentiable functions on Banach spaces.
\item Requiring the operator $A$ above to be bounded is crucial: in $\infty$-dimensional normed spaces, linearity does not imply continuity.
\item In calculus of variation, the curve $h$ from the small neighborhood of $0\in X$, is usually called a \emphidx{variation} and denoted $\delta x$. Don't confuse this with a Dirac delta function or a small real parameter.
\end{enumerate}
\end{remark}
Let $f: X \to \mathbb{R}$ be a (Fr\'echet) differentiable function and $X_0 \subset X$ be a subspace of $X$. Then $\gamma_\star$ is a \emph{critical point} \index{action!critical point} of $f$ with respect to $X_0$ if
\begin{equation}
Df\big(\gamma_\star\big)\Big|_{X_0} = 0, \quad\mbox{i.e.}\quad
Df\big(\gamma_\star\big)h = 0 \mbox{ for all } h\in X_0.
\end{equation}
%
It is possible to show that the space of curves
\begin{equation}
\mathcal{C}^2 := \big\{ \gamma: [t_1, t_2] \to M \mid \gamma \mbox{ is twice continuously differentiable}\big\},
\end{equation} equipped with the norm
\begin{equation}
\|\gamma\|_{\mathcal{C}^2} :=
\|\gamma\|_\infty + \|\dot \gamma\|_\infty + \|\ddot \gamma\|_\infty,
\end{equation}
is a Banach space, and $\mathcal{C}^2_0 = \big\{h\in \mathcal{C}^2 \mid h(t_1) = h(t_2) = 0\big\}$ with the induced norm, is a Banach subspace of $\mathcal{C}^2$.
Therefore, the action defined above is a functional
\begin{equation}
S : \mathcal{C}^2 \to \mathbb{R},\qquad \gamma \mapsto S[\gamma],
\end{equation}
and the evolution of the system is described by the critical points with respect to $\mathcal{C}^2_0$ of $S$ on the space of $\gamma \in \mathcal{C}^2$ with prescribed endpoints.
%TODO: Consider rewriting using q and v instead of qdot.
\begin{theorem}
Let $L = L(q, \dot q, t) : \mathbb{R}^{n}\times \mathbb{R}^{n}\times \mathbb{R} \to \mathbb{R}$ be differentiable.
The equations of motion for the mechanical system with lagrangian $L$ are given by the \emphidx{Euler-Lagrange equations}
\begin{equation}\label{eq:eulerlagrange}
\dv{t}\pdv{L}{\dot q^i} - \pdv{L}{q^i} = 0, \quad i=1,\ldots n.
\end{equation}
\end{theorem}
\begin{remark}
Be careful: when we omit the indices $i$, we use $\pdv{L}{q}$ to denote the gradient of $L$ with respect to the position variables $q$, and $\pdv{L}{\dot q}$ the gradient of $L$ with respect to velocity variables $\dot q$.
%
In particular, $\dot q$ in $\pdv{L}{\dot q}$ serves as a label to denote the velocity variable, and \textbf{not} as the derivative of $q$ with respect to time. We consider $q$ and $\dot q$ as curves parametrised by time only when we apply $\dv{t}$.
Therefore, you should read the Euler-Lagrange equations above as
\begin{equation}
\dv{t}\Bigg(\pdv{L(x,v)}{v^i}\Big|_{(x,v) = (q(t),\dot q(t))}\Bigg) - \pdv{L(x,v)}{x^i}\Big|_{(x,v) = (q(t),\dot q(t))} = 0, \qquad i=1,\ldots n.
\end{equation}
This explicit formulation, though precise, illustrates why such notational shortcuts are common and why I chose to adopt them.
\end{remark}
\begin{proof}
We need to show that any critical point of $S$ with respect to $\mathcal{C}^2_0$ has to satisfy \eqref{eq:eulerlagrange}.
First of all observe that for small $h\in \mathcal{C}^2_0$, we get
\begin{align}
S(\gamma + h) &= \int_{t_1}^{t_2} L(\gamma + h, \dot \gamma + \dot h, s) \dd s \\
&= \int_{t_1}^{t_2} % not clear how this step happens, specifically where the inner product comes from, maybe a comment on the procedure beforehand
L(\gamma, \dot \gamma, s) \dd s \\
&\quad + \int_{t_1}^{t_2} \left[
\left\langle
\pdv{L}{q}(\gamma, \dot \gamma, s),\;
h(s)
\right\rangle
+ \left\langle
\pdv{L}{\dot q}(\gamma, \dot \gamma, s),\;
\dot h(s)
\right\rangle
\right] \dd s \\
&\quad + O(\|h\|^2_{\mathcal{C}^2}),
\end{align}
where the inner product $\langle\cdot,\cdot\rangle$ is the usual scalar product in $\mathbb{R}^n$, and the last identity follows from applying a Taylor expansion of $L$ to second order around $(\gamma, \dot \gamma)$.
Therefore,
\begin{align}
S(\gamma+h) - S(\gamma) &= \int_{t_1}^{t_2} \left[
\left\langle\pdv{L}{q}(\gamma, \dot \gamma, s),\; h(s)\right\rangle
+ \left\langle\pdv{L}{\dot q}(\gamma, \dot \gamma, s),\; \dot h(s)\right\rangle
\right] \dd s\\
&\quad + O(\|h\|^2_{\mathcal{C}^2})\\
&= \left\langle\pdv{L}{\dot q}(\gamma, \dot \gamma, s),\; h(s)\right\rangle \Big|_{t_1}^{t_2} \\
&\quad + \int_{t_1}^{t_2} \left\langle
\pdv{L}{q}(\gamma, \dot \gamma, s)
- \dv{s}\pdv{L}{\dot q}(\gamma, \dot \gamma, s)
,\; h(s)\right\rangle \dd s\\
&\quad + O(\|h\|^2_{\mathcal{C}^2}).
\end{align}
The differential $DS(\gamma): {\mathcal{C}^2} \to \mathbb{R}$ can now be read from the equation above and is well--defined and is a bounded linear operator for all $\gamma\in {\mathcal{C}^2}$. Let's look at it term by term.\medskip
For $h\in \mathcal{C}^2_0$, the first term $\left\langle\pdv{L}{\dot q}(\gamma, \dot \gamma, s),\; h(s)\right\rangle\Big|_{t_1}^{t_2}$ has to vanish. Therefore, for $\gamma$ to be a critical point for $S$ it follows that the inner product in the integral has to vanish as well, i.e.,
\begin{equation}
\left\langle
\pdv{L}{q}(\gamma, \dot \gamma, s)
- \dv{s}\pdv{L}{\dot q}(\gamma, \dot \gamma, s)
,\; h(s)\right\rangle = 0 \quad\mbox{for all } h\in \mathcal{C}^2_0.
\end{equation}
%
Our choice of $h$ is arbitrary, so after a relabeling of the time, this implies
\begin{equation}\label{eq:EL-from-proof}
\pdv{L}{q}(\gamma, \dot \gamma, t)
- \dv{t}\pdv{L}{\dot q}(\gamma, \dot \gamma, t) = 0.
\end{equation}
Why is that the case? Assume that \eqref{eq:EL-from-proof} is non vanishing, then you can choose an $h$ with vanishing endpoints but non vanishing on the support of \eqref{eq:EL-from-proof}. With such an $h$ the integral above is strictly positive, contradicting the hypothesis.
Once we look at \eqref{eq:EL-from-proof} componentwise, we obtain the Euler-Lagrange equations
\begin{equation}
\dv{t}\pdv{L}{\dot q^i}(\gamma, \dot \gamma, t) - \pdv{L}{q^i}(\gamma, \dot \gamma, t) = 0, \quad i=1,\ldots n,
\end{equation}
as stated in the theorem, thereby concluding the proof.
\end{proof}
\begin{remark}
In general, the solution $q=q(t)$ of the Euler-Lagrange equations is just a \textbf{critical} point of the $S$ functional, i.e., it satisfies $S[q + \delta q] - S[q] = O(\|\delta q\|^2)$.
It does \textbf{not} have to be a minimum.
However, under some additional conditions it can be proven to be a \emph{local} minimum.
For example, if the matrix of second derivatives
\begin{equation}\label{eq:hsd}
\Lambda := \left( \pdv{L}{\dot q^i}{\dot q^j} \right)_{1\leq i,j\leq n}
\end{equation}
is positive definite.
This case is thoroughly studied in calculus of variation and in some branches of differential geometry.
\end{remark}
\begin{corollary}
If the lagrangian $L$ of a system is \emph{non--degenerate}\index{lagrangian!non-degenerate}, i.e., it satisfies the condition
\begin{equation}
\det \left(\pdv{L}{\dot q^i}{\dot q^j}
\right)_{1\leq i,j\leq n} \neq 0
\end{equation}
then the system satisfies Newton's determinacy principle.
\end{corollary}
\begin{tcolorbox}[title=Einstein's convention]
From now on, we will follow \emphidx{Einstein's convention}, that is, we will omit the summation symbol $\sum$ whenever an index appears twice in an expression.
For example, $y^{ji} x_i \equiv \sum_i y^{ji} x_i$.
\end{tcolorbox}
\begin{proof}
For a non--degenerate lagrangian, a direct computation shows that the Euler-Lagrange equations can be rewritten in the form
\begin{equation}
\ddot q^i = f^i(q,\dot q, t)
:= \Lambda^{ij}\left(\pdv{L}{q^j} - \pdv{L}{\dot q^j}{q^k} \dot q^k - \pdv{L}{\dot q^j}{t}\right),
\quad i=1,\ldots,n.
\end{equation}
Here $\left(\Lambda^{ij}\right) = \left(\Lambda^{ij}(q, \dot q, t)\right)$ are the coefficients of the inverse to the matrix $\Lambda$ from equation \eqref{eq:hsd}, i.e.,
\begin{equation}
\Lambda^{ik} \pdv{L}{\dot q^k}{\dot q^j} = \delta^{i}_{j}.
\end{equation}
\end{proof}
The proof of the corollary above shows that the Euler-Lagrange equations are a system of second order differential equations for the generalized coordinates $q$.
As such, we can use Euler-Lagrange equations as the equations of motion of a mechanical system with non--degenerate lagrangian.
\begin{remark}\label{rmk:manylagrangians}
\index{lagrangian!nonuniqueness}
\emph{The lagrangian of a mechanical system is defined only up to total derivatives}.
That is, the equations of motion remain unchanged if we add a total derivative to the lagrangian function:
\begin{equation}
\widetilde L(q,\dot q, t) = L(q, \dot q, t) + \dv{t} f(q,t).
\end{equation}
Indeed, the action $\widetilde S$ of a system with lagrangian $\widetilde L$ is
\begin{align}
\widetilde S[q] & = \int_{t_1}^{t_2} \widetilde L(q, \dot q, t) \,\dd t \\
& = \int_{t_1}^{t_2} L(q, \dot q, t) \,\dd t + \int_{t_1}^{t_2} \dv{t} f(q,t) \,\dd t \\
& = S[q] + f(q_2, t_2) - f(q_1, t_1).
\end{align}
As the additional $f$-dependent part is constant,
\begin{equation}
\widetilde S[q+\delta q] - \widetilde S[q]
= S[q+\delta q] - S[q]
\end{equation}
and thus the critical points of the two actions are the same.
Similarly, \emph{the lagrangian of a mechanical system does not change if it is multiplied by a constant factor: $\widetilde L = \alpha L$}.
As an aside, quantum mechanical systems no longer remain invariant under the transformations above. Transformations of the first type lead to rather subtle and interesting effects depending on the topology of the state space, while the number $\alpha$ is related to Planck's constant.
\end{remark}
Inn general, physical intuition would suggest that we expect the lagrangian of some system to be constructed composing small subsystems.
When these subsystems are not interacting one would also expect them to be independent from each other.
This idea takes the name of \emphidx{principle of additivity}.
\begin{tcolorbox}[title=Principle of additivity]
Assume that a mechanical system is the combination of two subsystems, say $A$ and $B$.
Let $L_A$ and $L_B$ be their respective lagrangians as if they were isolated (or \emph{closed}) systems.
By moving the two subsystems farther apart from each other, in the limit of infinite distance, the lagrangian of the full system tends to the limit lagrangian
\begin{equation}
L_{\lim} = L_A + L_B.
\end{equation}
\end{tcolorbox}
In more practical terms, this principle is saying that the equations of motion of the system $A$ cannot be dependent on quantities pertaining to $B$ and vice versa.
\subsection{From Lagrange back to Newton}\label{sec:dynamicspps}
Mechanical laws for the same system can look very different from each other, with varying degrees of simplification or complication: think for example as the motion of planets in a geocentric system of coordinates. The planets will start showing all sorts of epicycles and retrograde motions, while in a heliocentric system they will just move in ellipses.
In fact, there is a system of coordinates that simplifies our life the most: the \emph{inertial} coordinate system\index{coordinate system!inertial}.
Sadly, it is not unique, however, the galilean principle of relativity states that all inertial systems are equivalent to each other in a rather specific way.
\begin{tcolorbox}[title=Galilean principle of relativity]
There exist coordinate systems, called inertial, with the following two properties
\begin{enumerate}
\item all the laws of nature at all moments of time are the same in all inertial coordinate systems;
\item all coordinate systems in uniform rectilinear motion with respect to an inertial one are themselves inertial.
\end{enumerate}
\end{tcolorbox}
While the group-theoretical aspects of classical mechanics are deeply connected to our discussion and quite fascinating, we won't explore them further here.
For those intrigued by this topic, we suggest \cite{book:marsdenratiu} as an engaging reference.
For our concerns, an inertial system of coordinates on the galilean space-time is a system of coordinates that can be transformed into the ``standard'' galilean structure $\mathbb{R}\times\mathbb{R}^3$ via a galilean transformation.
If $(t, \vb*{x}) \in \mathbb{R}\times \mathbb{R}^3$ is an element of the ``standard'' galilean space-time, we call \emphidx{galilean transformation}s the transformations $(t,\vb*{x}) \mapsto (\widetilde t, \widetilde{\vb*{x}})$ listed below
\begin{enumerate}
\item translations: $\widetilde t = t + t_0$, $\widetilde{\vb*{x}} = \vb*{x} + \vb*{x}_0$, for $t_0\in\mathbb{R}$, $\vb*{x}_0\in\mathbb{R}^3$;
\item rotations and reflections: $\widetilde t = t$, $\widetilde{\vb*{x}} = G\vb*{x}$ for $G\in O(3)$ a $3\times 3$ orthogonal matrix;
\item uniform motions with velocity $\vb*{v}\in\mathbb{R}^3$: $\widetilde t = t$, $\widetilde{\vb*{x}} = \vb*{x} + \vb*{v} t$.
\end{enumerate}
Then, the galilean principle of relativity implies that the lagrangian of a closed mechanical system is invariant, modulo total derivatives, with respect to the galilean transformations. \medskip
\begin{figure}[ht]
\centering
\includegraphics[width=.85\linewidth]{images/coni-mathyear-21-21.jpg}
\caption{A graphical introduction to Newton's laws of motion,
courtesy of \href{https://web.archive.org/web/20210602092955/https://twitter.com/Coni777/status/1399953219997032448}{Constanza Rojas-Molina}.
If you feel creative, consider contributing to the
\href{http://crojasmolina.com/illustration/the-mathyear-challenge/list-of-prompts-for-mathyear/}{\#mathyear} challenge.}
\end{figure}
We will now see how we can derive Newton's laws from Hamilton's principle as a consequence of the galilean principle of relativity. For an alternative discussion on this topic see \cite[Chapters 1.1 and 1.2]{book:arnold}.
\begin{theorem}
The lagrangian of an isolated point particle in an inertial system of coordinates has the form
\begin{equation}\label{eq:singleptlag}
L(\dot{\vb*{x}}) = \frac{m\,\|\dot{\vb*{x}}\|^2}2
\end{equation}
where $m\in\mathbb{R}$ is a constant called the \emph{mass} of the point particle.
\end{theorem}
\begin{remark}
In view of our previous discussions, the statement above should be read as
\begin{quote}
the lagrangian of an isolated point particle in an inertial system of coordinates has the form~\eqref{eq:singleptlag} up to total derivatives.
\end{quote}
\end{remark}
\begin{proof}
The invariance with respect to translations implies that $L(\vb*{x} + \vb*{x}_0, \dot{\vb*{x}}, t + t_0) = L(\vb*{x}, \dot{\vb*{x}}, t)$, that is, the lagrangian must be independent from $t$ and $\vb*{x}$: the lagrangian $L = L(\dot{\vb*{x}})$ must be a function of the velocity only.
Euler-Lagrange equations~\eqref{eq:eulerlagrange} then imply that either $L$ is the constant function altogether or the velocity must be constant. Indeed, we have
\begin{equation}
0 = \dv{t}\pdv{L}{\dot{\vb*{x}}} - \pdv{L}{\vb*{x}} = \dv{t}\pdv{L}{\dot{\vb*{x}}},
\end{equation}
that is, $\pdv{L}{\dot{\vb*{x}}} = \mathrm{const}$. Since $L$ only depends on the velocity, this means that either $L$ is the constant function, which would make Euler-Lagrange equations completely trivial, or $\dot{\vb*{x}}(t) = \mathrm{const}$.
We just derived an alternative proof of Corollary~\ref{cor:Nfl}, Newton's first law, from the Galilean principle of relativity.
The invariance from orthogonal transformations then implies that $L(\dot{\vb*{x}}) = L(G\dot{\vb*{x}})$, where $G^t G = \Id$. That is, $L$ cannot depend on the direction of the velocity, only on its magnitude:
\begin{equation}
L(\dot{\vb*{x}}) = L(\|\dot{\vb*{x}}\|), \quad \|\dot{\vb*{x}}\|^2 := \langle\dot{\vb*{x}}, \dot{\vb*{x}}\rangle.
\end{equation}
Since we expect the lagrangian to be a smooth function, we want to avoid square roots and therefore we will write
\begin{equation}
L(\dot{\vb*{x}}) = L(\|\dot{\vb*{x}}\|^2).
\end{equation}
The invariance with respect to uniform motion now implies that the lagrangian must actually be proportional to $\|\dot{\vb*{x}}\|^2$.
For convenience, let's first look at the case of small velocities: applying the galilean transformation
\begin{equation}
\vb*{x} \mapsto \vb*{x} + \epsilon \vb*{v}t,
\end{equation}
in the limit $\epsilon \to 0$, we can use a Taylor expansion around $\|\dot{\vb*{x}}\|^2$ to get
\begin{equation}
L(\|\dot{\vb*{x}}\|^2) \mapsto L(\|\dot{\vb*{x}} + \epsilon \vb*{v}t\|^2) = L(\|\dot{\vb*{x}}\|^2) + 2\epsilon\,\langle\vb*{v}, \dot{\vb*{x}}\rangle\,L'(\|\dot{\vb*{x}}\|^2) + O(\epsilon^2).
\end{equation}
Here the $'$ denotes derivation with respect to the only argument of the function $L$.
The invariance of the equations of motion then implies that the linear term in $\epsilon$ should be a total derivative $\dv{t} f(t, \vb*{x}) = 2\,\langle\vb*{v}, \dot{\vb*{x}}\rangle\,L'(\|\dot{\vb*{x}}\|^2)$.
This can happen iff $\pdv{t} f(t, \vb*{x}) = 0$ and $\langle \pdv{f}{\vb*{x}}, \dot x\rangle = 2\,\langle\vb*{v}, \dot{\vb*{x}}\rangle L'(\|\dot{\vb*{x}}\|^2)$ is linear in $\dot{\vb*{x}}$.
In particular, this means that
\begin{equation}
L'(\|\dot{\vb*{x}}\|^2) = \mathrm{const} =: \frac{m}2,
\end{equation}
that is, the lagrangian is of the form \eqref{eq:singleptlag} for some constant value $m\in\mathbb{R}$.
Finally, the lagrangian \eqref{eq:singleptlag} is transformed by a general galilean transformation $\vb*{x} \mapsto \vb*{x} + \vb*{v}t$ into
\begin{equation}
\frac{m \|\dot{\vb*{x}}\|^2}2 \mapsto
\frac{m \|\dot{\vb*{x}}\|^2}2 + m\,\langle\vb*{v},\dot{\vb*{x}}\rangle + \frac{m \vb*{v}^2}2
= \frac{m \|\dot{\vb*{x}}\|^2}2 + \dv{t}\left(m\,\langle\vb*{v},\vb*{x}\rangle + \frac{m \vb*{v}^2 t}2\right),
\end{equation}
and thus the equations of motion remain invariant under the transformation.
\end{proof}
\begin{corollary}[Newton's first law]\label{cor:Nfl}\index{Newton!first law}
In an inertial frame of reference, an isolated point particle either does not move or it is in uniform motion with constant velocity.
\end{corollary}
\begin{proof}
It follows immediately by computing the Euler-Lagrange equations for \eqref{eq:singleptlag}
\begin{equation}
0 = \dv{t} \pdv{L}{\dot x^i} - \pdv{L}{x^i} = m \ddot x^i, \qquad i=1,2,3,
\end{equation}
whose solutions are all of the form $x^i(t) = x^i_0 + v^i_0 t$.
\end{proof}
The additive property of the lagrangians now implies that for a system of $N$ particles which do not interact, the lagrangian is simply the sum
\begin{equation}\label{eq:freel}
L = \sum_{k=1}^N \frac{m_k \|\dot{\vb*{x}}_k\|^2}{2}.
\end{equation}
We call lagrangians of this form \emph{free}\index{lagrangian!free}.
\begin{remark}
A lagrangian can always be multiplied by an arbitrary constant without affecting the equations of motion;
such multiplication then amounts to a change in the unit of mass.
So, the above definition of mass becomes meaningful when we take the additive property into account:
the ratios of the masses remain unchanged and it is only these ratios which are physically meaningful.
\end{remark}
\index{lagrangian!interactions}
To include interactions between the point particles in this formalism, we need to add to the free lagrangian \eqref{eq:freel} a function $-U(\vb*{x}_1, \ldots, \vb*{x}_N)$ which depends on the nature of the interactions:
\begin{equation}\label{eq:mechlag}
L := T-U := \sum_{k=1}^N \frac{m_k \|\dot{\vb*{x}}_k\|^2}{2} -U(\vb*{x}_1, \ldots, \vb*{x}_N).
\end{equation}
The first sum, $T = \sum_{k=1}^N \frac{m_k \|\dot{\vb*{x}}_k\|^2}{2}$, is called \emph{kinetic energy} of the system of particles, while the function $U = U(\vb*{x}_1, \ldots, \vb*{x}_N)$ is called \emph{potential energy}.
Lagrangians of the form $T-U$ are often called \emph{natural}.
\index{lagrangian!natural}\index{energy!potential}\index{energy!kinetic}
\begin{theorem}[Newton's second law]
\index{Newton!second law}
The equations of motion of a system of $N$ point particles with natural lagrangian \eqref{eq:mechlag} are of the form
\begin{equation}\label{eq:newton2}
m_k \ddot{\vb*{x}}_k = \vb*{F}_k, \quad k=1,\ldots,N
\end{equation}
where $\vb*{F}_k (\vb*{x}) = -\pdv{U (\vb*{x})}{\vb*{x}_k}$, $\quad k=1,\ldots,N$.
\end{theorem}
The vector $\vb*{F}_k$ is called the \emphidx{force} acting on the $k$-th point particle. To be more precise, the force is a vector field since $\vb*{F}_k : \vb*{x} \to \vb*{F}_k(\vb*{x})$ maps every point in the configuration space to its own vector.
\begin{exercise}\label{ex:N3l1}\index{Newton!third law}
Prove \emph{Newton's third law}, i.e., for each of the $k$ point particles it holds
\begin{equation}
\vb*{F}_k = -\sum_{j\neq k} \vb*{F}_j.
\end{equation}
\textit{Hint: use the invariance with respect to spatial translations or sneak peek forward to the conservation of total momentum.}
\end{exercise}
\begin{remark}
\begin{enumerate}
\item Mechanical systems are time-\emph{reversible}: they are also invariant with respect to the transformation $t\mapsto -t$.
\item If you consider systems in interaction with the environment, you may end up with lagrangians that are no longer invariant with respect to galilean transformations and can explicitly depend on time.
\end{enumerate}
\end{remark}
\begin{example}[Free fall]
Consider the vertical motion of a point particle of mass $m$ in the external field with potential $U(z) = m g z$, see also Example~\ref{ex:sprPen}. The natural lagrangian of the system is
\begin{equation}
L = \frac{m\dot z^2}2 - mgz,
\end{equation}
which corresponds to the equation of motion $\ddot z = -g$: this is the equation of motion of a point particle in free fall towards Earth. In agreement with Galileo's law, the acceleration is constant and does not depend on the mass.
\end{example}
\begin{example}\label{ex:kepler1}
The motion of $N$ point particles with masses $m_1, \ldots, m_N$ in their gravitational field, is described by the lagrangian
\begin{equation}
L = \sum\frac{m_k \|\dot{\vb*{x}}_k\|^2}{2} + \sum_{k < l} G \frac{m_k m_l}{\|\vb*{x}_k - \vb*{x}_l\|},
\end{equation}
where $G$ is the gravitational constant.
To study the \emph{approximate} description of the motion of a planet of mass $m$ around the Sun, which has mass $M \gg m$, one can assume the effects of the planet on the Sun to be negligible and ignore the interaction with the other planets.
In such a case, the motion of the planet is described by the lagrangian of a point particle with a Newtonian gravitational potential
\begin{equation}
L = \frac{m\|\dot{\vb*{x}}\|^2}{2} + \frac{G M m}{\|\vb*{x}\|},
\end{equation}
whose equation of motion should remind you of \eqref{eq:keplerex} from Example~\ref{ex:Kepler0}.
\end{example}
\index{energy!kinetic}
To understand better why $T$ in \eqref{eq:mechlag} is called kinetic energy, it is useful to look at its relation with Newton's second law \eqref{eq:newton2}:
\begin{equation}
\dv{t} T
= m \langle\dot{\vb*{x}}(t), \ddot{\vb*{x}}(t)\rangle
= \left\langle\dot{\vb*{x}}(t), \vb*{F}(\vb*{x}(t))\right\rangle.
\end{equation}
This confirms the intuitive notion that the kinetic energy should increase if a force pushes the particle in the direction of the current motion and should decrease when it pulls the particle in the opposite direction.
There is more, in fact our computation above shows that
\begin{equation}
T(t_1) - T(t_0) = \int_{t_0}^{t_1} \left\langle\dot{\vb*{x}}(t), \vb*{F}(\vb*{x}(t))\right\rangle\; \dd t = \int_{\vb*{x}_0}^{\vb*{x}_1} \left\langle\vb*{F}(\vb*{x}), \dd{\vb*{x}}\right\rangle,
\end{equation}
where $\vb*{x}_i := \vb*{x}(t_i)$.
This is equivalent to say that the change of kinetic energy is equal to the \emph{work}\index{work done by a force} done by the force, i.e., the integral of $\vb*{F}$ along the curve $\vb*{x}(t)|_{t\in[t_0, t_1]}$. The name comes from the fact that, physically, you can think of $F(\vb*{x}) \cdot \dd{\vb*{x}}$ as the infinitesimal contribution of the vector field to the acceleration.
\begin{remark}
For $N=1$, Stokes' theorem implies that the integral above is independent of the path between $\vb*{x}_0 = \vb*{x}(t_0)$ and $\vb*{x}_1 = \vb*{x}(t_1)$ if and only if $\curl \vb*{F} = 0$, which in turn is true if and only if there exists a function $U:\mathbb{R}^3\to\mathbb{R}$ such that $\vb*{F} = -\frac{\partial U}{\partial \vb*{x}}$.
%
In fact, this is true in any dimension by using the general version of Stokes' theorem: the work done by the force depends only on the endpoints of the integral if and only if there is $U:\mathbb{R}^n\to\mathbb{R}$, unique up to an additive constant, such that $\vb*{F} = -\frac{\partial U}{\partial \vb*{x}}$.
%
You can read more about this in \cite[Chapter 2.5]{book:arnold} and \cite[Theorem 6.3 and 8.1]{book:knauf}.
\end{remark}
\begin{remark}
Often in physics, the kinetic energy is instead defined as \emph{the work required to bring the mass from rest to some speed~$\dot{\vb{x}}$}.
One can then perform the computation above backwards
\begin{align}
\int_{x_0}^{x^1} \left\langle\vb*{F}(\vb*{x}), \dd{\vb*{x}}\right\rangle
&= \int_{t_0}^{t_1} \left\langle\dot{\vb*{x}}(t), \vb*{F}(\vb*{x}(t))\right\rangle\; \dd t \\
&= \int_{t_0}^{t_1} m \langle\dot{\vb*{x}}(t), \ddot{\vb*{x}}(t)\rangle\; \dd t
= \int_{t_0}^{t_1} \dv{t} \frac{m}{2} \langle\dot{\vb*{x}}(t), \dot{\vb*{x}}(t)\rangle \; \dd t,
\end{align},
leading to the definition of kinetic energy as $T = \frac{m}{2} \|\dot{\vb{x}}\|^2$.
\end{remark}
Forces that can be written in the form $\vb*{F} = -\frac{\partial U}{\partial \vb*{x}}$, for some function $U$, are called \emph{conservative}.\index{force!conservative}
We will understand better why in a couple of sections.
Not all the forces in nature are conservative, and in that case the results of this section do not directly apply.
We don't have to go very far to see an example of this, but we can also see that the lagrangian approach can be easily extended to include non-conservative forces.
\begin{example}\label{exa:magnetic}\index{magnetic!field}\index{magentic!vector potential}
Mechanical systems affected by an external magnetic field $\vb* B$ can be described in the lagrangian formalism by adding a linear term in the velocities to a natural lagrangian \eqref{eq:mechlag}:
\begin{equation}\label{eq:magLag}
\widetilde L = L + \frac ec \sum_{k=1}^N \langle\vb* A(\vb*{x}_k), \dot{\vb*{x}}_k\rangle.
\end{equation}
Here the constant $e$ is the electric charge of the point particles and $c$ is the speed of light in vacuum.
The magnetic field is given by $\vb* B = \curl \vb* A$, the vector field $\vb* A$ is called magnetic vector potential.
We will not see this in the course, but magnetic phenomenons have a natural description only in the relativistic approach. We see a hint of this fact here, in that \eqref{eq:magLag} is not invariant with respect to the galilean transformations.
\begin{exercise}\label{exe:magnetic}
Show that the equations of motion \eqref{eq:newton2} corresponding to a magnetic lagrangian \eqref{eq:magLag} are given by
\begin{equation}
m_k \ddot{\vb*{x}}_k = \vb*{F}_k + \frac ec \dot{\vb*{x}}_k \times \vb* B(\vb*{x}_k)
\end{equation}
where $\times$ denotes the usual vector product in $\mathbb{R}^3$ and, as mentioned above, $\vb* B = \curl \vb* A$ is the magnetic field.
The additional term $\frac ec \dot{\vb*{x}}_k\times \vb* B(\vb*{x}_k)$ is the \emphidx{Lorentz force} acting on the $k$th particle of charge $e$ immersed in the magnetic field $\vb* B$. By definition, the Lorenz force is orthogonal to the velocity of the particle and to the magnetic field and thus tends to curve the trajectory of the particle.
\warpHTMLonly{<p><iframe scrolling=no title=The Lorentz force src=https://www.geogebra.org/material/iframe/id/axnqyhdx/width/1100/height/800/border/888888/sfsb/true/smb/false/stb/false/stbh/false/ai/false/asb/false/sri/true/rc/false/ld/false/sdz/false/ctl/false width=1100px height=800px style=border:0px;> </iframe></p>
<p>In the simulation above you can see how the Lorentz force can affect a charged particle motion in a uniform magnetic field. For an easy comparison two different particles are shown, with independent parameters but immersed in the same magnetic field. The value $q = e/c$ corresponds to the charge of the particle. The standalone version of this applet is <a href=https://www.geogebra.org/m/tvbfjfct>available on geogebra</a> and was derived from an <a href=https://www.geogebra.org/m/xpRMzPgc>applet by Luca Moroni</a>.</p>}
For a beautiful geometric discussion of this problem, you can refer to \cite[Chapter 8.3 (9.3 in more recent editions)]{book:amr}.
\end{exercise}
Note that the magnetic vector potential is not unique!
For any function $f$, the transformation
\begin{equation}
\vb* A \mapsto \vb* A + \pdv{f}{\vb*{x}}
\end{equation}
will produce the same field.
This is known as \emphidx{gauge transformation}.
Under this transformation the lagrangian is transformed as
\begin{equation}
\widetilde L \mapsto \widetilde L + \frac{e}{c} \dv{f}{t}
\end{equation}
but we know that the equations of motion remain invariant under the addition of a total derivative to the Lagrangian.
The concept of gauge invariance is central in many problems of modern physics.
\end{example}
\section{First steps with conserved quantities}
\subsection{One degree of freedom}\label{sec:bdf}
Consider the one dimensional Newton's equation for a point particle with unit mass and position $x(t)$:
\begin{equation}\label{eq:oscillator}
\ddot x = F(x), \qquad F:\mathbb{R}\to\mathbb{R}, \quad t\in \mathbb{R}.
\end{equation}
Introducing the auxiliary variable $y(t) = \dot x(t)$, \eqref{eq:oscillator} is equivalent to the system of first order equations
\begin{equation}\label{eq:oscillatorfirstorder}
\left\lbrace
\begin{aligned}
\dot x & = y \\
\dot y & = F(x)
\end{aligned}
\right..
\end{equation}
The solutions of \eqref{eq:oscillatorfirstorder} are parametric curves $(x(t),y(t)):\mathbb{R}\to\mathbb{R}^2$ in the $(x,y)$-space.
These curves are often called \emphidx{trajectories} of the system or \emph{integral curves} of the ordinary differential equation.
If $y\neq0$, we can apply the chain rule, $\dv{y}{t} = \dv{y}{x} \dv{x}{t}$, to get
\begin{equation}\label{eq:lef}
\frac{F(x)}y = \frac{\dot y}{\dot x} = \dv{y}{x}.
\end{equation}
What is important here, is that this new equation does not depend on time. Although eliminating time and considering \eqref{eq:lef} comes at a cost -- the solution is now an implicit curve $y(x)$ -- it also presents a substantial benefit: this new equation can be solved exactly!
How is that so? After a bit of algebra and integrating both sides with respect to $x$, we can rewrite this as
\begin{align}
&\int y\,\dv{y}{x}\dd x - \int F(x)\, \dd x \notag \\
& = \int y\,\dd y - \int F(x)\, \dd x = 0 \label{eq:pp-notime-int}
\end{align}
Integrating the integral on the left, we get
\begin{equation}
\frac12 y^2 + C_y = \int F(x) dx.
\end{equation}
%
\begin{remark}
This identity in \eqref{eq:pp-notime-int} is often expressed as
\begin{equation}
y\,\dd y - F(x)\, \dd x = 0.
\end{equation}
This may look like a formal manipulation, but it is actually a rigorous identity in terms of differential forms.
To know more, you can refer to \cite[Equation (5.1) with $f=y$ and Remark 5.1.3]{lectures:aom:seri} or any good textbook on differential forms.
For simplicity, we will limit ourselves to the formal manipulation.
\end{remark}
%
If $U(x)$ is such that $F(x) = -\dv{U}{x}$, we can further simplify the equation into
\begin{equation}\label{eq:pp-energy}
\frac12 y^2 = -U(x) + C,
\end{equation}
where $C = C_x - C_y \in\mathbb{R}$ is just a number due to the constants of integration. Varying $C$, \eqref{eq:pp-energy} describes a family of curves in the $(x,y)$-plane which correspond to different solutions of our original problem.
We can also locally invert the equation above to get the explicit solution
\begin{equation}
y(x) = \pm \sqrt{2(C-U(x))}.
\end{equation}
Equation \eqref{eq:pp-energy} may already be familiar: $\frac12 y^2 + U(x)$ is the sum of the kinetic energy $\frac12 y^2 = \frac12 {\dot x}^2$ of the particle and its potential energy $U$. In fact, the statement above is a theorem and we can prove it without the need of the formal step with the differentials.
\begin{theorem}\label{thm:ham1}
Let $H(x, y) := \frac12 y^2 + U(x)$ where $U:\mathbb{R}\to\mathbb{R}$ is such that $F(x) = -\dv{U}{x}$.
Then, the connected components of the level curves $H(x,y) = C$ are the integral curves of \eqref{eq:oscillatorfirstorder}.
\end{theorem}
The function $H$ introduced in Theorem~\ref{thm:ham1} is called the \emph{total energy}\index{energy} of the mechanical system.
\begin{proof}
The proof is surprisingly simple:
\begin{align}
\dot H & = \frac{\partial H}{\partial x}\dv{x}{t} + \frac{\partial H}{\partial y}\dv{y}{t} \\
& = \dv{U}{x} y + y F(x)
= -y F(x) + y F(x) = 0.
\end{align}
\end{proof}
The fact that $H(x,y)$ remains constant on the trajectories is crucial: when this happens we say that the total energy of the system is a \emph{conserved quantity}\index{energy!conservation (1d)}.
A curve $(x(t), y(t))$ spanned by a solution of \eqref{eq:oscillatorfirstorder} is called a \emphidx{phase curve}.
\begin{figure}[htbp]
\centering
\includegraphics[width=.7\linewidth]{images/potential-curves-pendulum.pdf}
\caption{Integral curves for the pendulum}
\label{fig:pendulum}
\end{figure}