
\documentclass[12pt, a4paper]{amsart}


\usepackage{amsmath,amssymb,amscd,amsfonts}
\newtheorem{thm}{Theorem}[subsection]
\newtheorem{lem}[thm]{Lemma}
\newtheorem{rem}[thm]{Remark}
\newtheorem{prop}[thm]{Proposition}
\newtheorem{cor}[thm]{Corollary}
\newtheorem{defn}[thm]{Definition}
\newtheorem{assu}[thm]{Assumption}
\newtheorem{claim}[thm]{Claim}
\newtheorem{ex}[thm]{Example}
\newtheorem{exer}[thm]{Exercise}

\newcommand\delbar{\overline{\partial}}
\newcommand\PIC{{\text{\rm Pic}}(X)}
\newcommand\Pic{{\text{\rm Pic}}}
\newcommand\Ram{{\text{\rm Ram}}}
\newcommand\dimm{{\text{\rm dim}}}
\newcommand\rank{{\text{\rm rank}}}
\newcommand\rk{{\text{\rm rank}}}
\newcommand\codim{{\text{\rm codim}}}
\newcommand\dg{{\text{\rm deg}}}
\newcommand\PX{{\text {\rm Pic}}^0(X)}
\newcommand\PXT{{\text {\rm Pic}}^{\tau }(X)}
\newcommand\DI{{\text {\rm dim}}   }
\newcommand\DX{{\text {\rm dim}}(X)}
\newcommand\DY{{\text {\rm dim}}(Y)}
\newcommand\PA{{\text {\rm Pic}}^0(A)}
\newcommand\ALB{{\text{\rm Alb}}(X)}
\newcommand\alb{\text{\rm a}}
\newcommand\id{\text{\bf 1}}
\newcommand\al{{\alpha}}
\newcommand\bb{{\beta}}
\newcommand\Alb{\text{\rm Alb}}
\newcommand\Aut{\text{\rm Aut}}
\newcommand\gal{\text{\rm Gal}}
\newcommand\chr{\text{\rm char}}
\newcommand\Hom{\text{\rm Hom}}
%\newcommand\ker{\text{\rm ker}}
\newcommand\im{\text{\rm im}}
\newcommand\coker{\text{\rm coker}}
\newcommand\lra{\longrightarrow}
\newcommand\ot{{\otimes}}
\newcommand\OO{{\mathcal{O}}}
\newcommand\OY{{{\OO _Y}}}
\newcommand\OX{{{\OO _X}}}
\newcommand\OZ{{{\OO _Z}}}
\newcommand\PPP{{\mathcal{P}}}
\newcommand\PP{{\mathbb{P}}}
\newcommand\ox{{\omega _X}}
\newcommand\EE{{\mathcal{E}}}
\newcommand\FF{{\mathcal{F}}}
\newcommand\F{{\mathcal{F}}}
\newcommand\inv{{^{-1}}}
\newcommand\dual{{^{\vee }}}
\newcommand\ddual{{^{\vee \vee}}}
\newcommand\HH{{\mathcal{H}}}
\newcommand\GG{{\mathcal{G}}}
\newcommand\BB{\mathcal{B}}
\newcommand\LL{\mathcal{P}}
\newcommand\KK{{\mathcal{K}}}
\newcommand\QQ{{\mathcal{Q}}}

\newcommand\Q{{\mathbb{Q}}}
\newcommand\CC{{\mathbb{C}}}
\newcommand\AAA{{\mathbb{A}}}
\newcommand\ZZ{{\mathbb{Z}}}
\newcommand\RR{{\mathbb{R}}}
\newcommand\III{{\mathcal{I}}}
\newcommand\JJJ{{\mathcal{JJJ}}}
\newcommand\sh{{\hat {\mathcal S}}}
\newcommand\s{{ {\mathcal S}}}

\newcommand\cA{{\mathcal{A}}}
\newcommand\cB{{\mathcal{B}}}
\newcommand\cC{{\mathcal{C}}}
\newcommand\cD{{\mathcal{D}}}
\newcommand\cE{{\mathcal{E}}}
\newcommand\cF{{\mathcal{F}}}
\newcommand\cG{{\mathcal{G}}}
\newcommand\cH{{\mathcal{H}}}
\newcommand\cI{{\mathcal{I}}}

\newcommand\bR{{\mathbb R}}
\newcommand\bZ{{\mathbb Z}}
\newcommand\bC{{\mathbb C}}
\newcommand\bQ{{\mathbb Q}}
\newcommand\bN{{\mathbb N}}
\newcommand\bA{{\mathbb A}}
\newcommand\bP{{\mathbb P}}
\newcommand\bF{{\mathbb F}}

\newcommand\mb[1]{{{\mathbb{{#1}}}}}
\newcommand\mc[1]{{{\mathcal{{#1}}}}}
\newcommand\f[1]{{{\frak{{#1}}}}}
\newcommand\cx[1]{{{#1}^\bullet}}

%%%%%%%%%%%%%%%%%%%%%%%%%
%%%%%%%%%%%%%%%%%%%%%%%%%
\begin{document}

\begin{center}
{\Large Advanced Algebra I}\\
 Sep. 22, 2006 (Fri.)
\end{center}

\section{Set Theory}

We recall some set theory that will be frequently used in the
sequel or that is not covered in the basic college course.
However, we will keep this chapter as minimum as possible.

We assume the notion of "set" and some basic operation of sets
without bothering their definition.

\subsection{Zorn's Lemma}
\begin{defn}
A set  $S$ is said to be {\bf partially ordered} if there is a
relation $\le$  such that
\begin{enumerate}
\item (reflexive) $x \le x$

\item (anti-symmetric) if $x \le y$ and $y \le x$, then $x=y$.

\item (transitive) if $x \le y$ and $y \le z$ then  $ x \le z$.
\end{enumerate}

We usually call a partially ordered set to be a POSET.
\end{defn}

\begin{defn}
A pair of elements in an POSET is said to be {\bf comparable} if
either $x \le y$ or $y \le x$. A set is said to be {\bf totally
ordered} (or linearly ordered) if every pair is comparable.
\end{defn}

We also need the following definition:

\begin{defn}
A maximal element of an poset $S$ is an element $m \in S$ such
that if $m \le x$ then $m=x$.\\

Foe a given subset $T \subset S$, an upper bound of $T$ is an
element $b \in S$ such that $x \le b$ for all $x \in T$.
\end{defn}

One has the following

\begin{thm}[Zorn's lemma]
Let $S$ be a non-empty  poset. If every non-empty totally ordered
subset (usually called a "chain") has an upper bound, then there
exists a maximal element in $S$.
\end{thm}

Zorn's Lemma could be taken as an axiom of set theory. It can be
proved to be equivalent with the Axiom of Choice. It's also
equivalent to the  Well-ordering Principle. We simply give the
statement of these. The reader can find the proof in most of the
books on set theory.

An ordered set is said to be well-ordered if it is totally ordered
and  every non-empty subset $B$ has a least element, i.e. an
element $a \in B$ such that $a \le x$ for all $x \in B$.

\begin{thm} [Well-ordered Principle]
Every non-empty set can be well-ordered.
\end{thm}

One might wondering that $(\bQ, \le)$ equipped with the usual
ordering is not well-ordered. So the statement says that there is
another ordering which make the set $\bQ$ well-ordered.

\begin{ex}
Let $R$ be a non-zero commutative ring. One can prove that there
exists a maximal ideal by using Zorn's lemma. The proof goes as
following: Let $S=\{ I \lhd R| I \ne R\}$ equipped with the
$\subset$ as the partial ordering. $S \ne \emptyset $ because $0
\in S$. For a chain $\{I_j\}_{j \in J}$, one has a upper bound
$I=\cup I_j$. Then we have a maximal element in $S$ by Zorn's
lemma. One can easily show that the maximal element corresponds to
a maximal ideal.
\end{ex}

\subsection{cardinality}
In order to compare the "size of sets", we introduce the
cardinality.

\begin{defn}
Two sets $A,B$ are said to have the same cardinality if there is a
bijection between them, denoted $|A|=|B|$.\\ And we say $|A| \le
|B|$ if there is a injection from $A$ to $B$.
\end{defn}

It's easy to see that the cardinality has the properties that $|A|
\le |A|$ and if $|A| \le |B|, |B| \le |C|$, then $|A| \le |C|$. So
It's likely that the "cardinality are partially ordered" or even
totally ordered.

\begin{lem} \label{exer1}
Given two set $A,B$, either $|A| \le |B|$ or $|B| \le |A|$.
\end{lem}
\begin{proof}[Sketch]
Consider $$S=\{ (C,f)| C \subset A, f: C \to B \text{ is an
injection} \}.$$ Apply Zorn's lemma to $S$, one has an maximal
element $(D,g)$, then one claim that either $D=A$ or $im(g)=B$. \\
We leave it as an exercise for the readers.
\end{proof}

\begin{thm}[Schroeder-Bernstein]
If $|A| \le |B|$ and $|B| \le |A|$, then $|A|=|B|$.
\end{thm}

\begin{proof}[Sketch]
Let $f: A \to B$ (resp. $g: B \to A$) be the given injections
respectively. One needs to construct a bijection by using $f$ and
$g$.

Some parts of $A$ use $f$ and some parts not. So we consider the
partition
$$ A_1:=\{a \in A| a \text{ has parentless ancestor in } A \},$$
$$ A_2:=\{a \in A| a \text{ has parentless ancestor in } B \},$$
$$ A_3:=\{a \in A| a \text{ has infinite ancestor} \}.$$
And so does $B$.

Then we claim that $f$ restricted to $A_1,A_3$ are bijections to
$B_1,B_3$. And $g$ restricted to $B_2,B_3$ are bijections to $A_2,
A_3$. So the desired bijection can be constructed.
 \end{proof}

We need some more properties of cardinality. If
$|A|=|\{1,..,n\}|$, then we write $|A|=n$. And if
$|A|=|\mathbb{N}|$ then we write $|A|=\aleph_0$.

\begin{prop}\label{infiniteN}
If $A$ is infinite, then $\aleph_0 \le |A|$.
\end{prop}
\begin{proof}[Sketch]
By Axiom of Choice.
\end{proof}

\begin{defn}
$$ |A|+|B|:=|A \amalg B|,$$
$$ |A| \cdot |B| := |A \times B|.$$
\end{defn}

We have the following properties:
\begin{prop}
\noindent
\begin{enumerate}
\item If $|A|$ is infinite and $|B|$ is finite, then $|A+B|=|A|$.

\item If $|B| \le |A|$ and $|A|$ is infinite, then $|A+B|=|A|$.

\item If $|B| \le |A|$ and $|A|$ is infinite, then $|A \times
B|=|A|$.
\end{enumerate}
\end{prop}

\begin{proof}
For (1), take a countable subset $A_0$ in $A$ by Proposition
\ref{infiniteN}. One sees that $|A_0|=|A_0|+|B|$ by shifting the
index by $|B|$. Then we have $$ |A|=|A-A_0|+|A_0| =
|A-A_0|+|A_0|+|B|= |A|+|B|.$$

For (2), it's enough to see that $|A+A| \le |A|$ since clearly
$$|A| \le |A+B| \le |A+A|.$$ Pick an maximal subset $X \subset A$
having the property that $|X+X| \le |X|$ by Zorn's Lemma. One
claim that $A-X$ is finite, and then we are done by (1).

To see the claim, if $A-X$ is infinite, then there is a countable
subset $A_0 \subset A-X$. One can construct an injective function
$A \amalg X \amalg A \amalg X \to A \amalg X$ which contradicts to
the maximality of $X$.

For (3), it suffices to show that $|A \times A|=|A|$. We sketch
the proof. Let $$S=\{ (B,f)| B \text{ is an infinite subset of }A,
f: B \to B \times B \text{ an bijection}\}.$$ $S$ is non-empty
because $S$ contains an infinite countable subset. $S$ can be
equipped with natural partial ordering and by Zorn's Lemma, there
exists a maximal element, say $(M,g)$.

Let $C$ be the complement of $M$ in $A$. If $|C|\le |M|$, then by
$(2)$, $|A|=|M|$. Hence there is a bijection $h: A \to M$. It
follows that  there is a bijection $A \stackrel{h}{\to} M
\stackrel{G}{\to} M \times M
\stackrel{(h^{-1},h^{-1})}{\longrightarrow} A \times A$.

Finally, if $|C| \ge |M|$, then there is a subset $M_1 \in C$ such
that $|M_1|=|M|$. Let $M'=M \cup M_1$. One can construct a
bijection from $M' \to M' \times M'$. This contradicts to the
maximality of $M$. Hence we are done.
\end{proof}

\pagebreak

\begin{center}
 Sep. 22, 2006 (Fri.)
\end{center}

\section{Group Theory}
The concept of groups is a very fundamental one in Mathematics. It
arise as automorphism of certain sets. For example, some geometry
can be described as the groups acting on the geometric objects.

In the first section, we are going to recall some definition and
basic properties of groups in general. In the second section, we
introduce the acting of groups. The groups action can find many
applications in geometry, algebra, and  the theory of groups
itself. In the third section, we are would like to take care of
various aspects of reducing or factoring groups into simple ones.

\subsection{Basic group theory}
\begin{defn}
A group $G$ is a set together with a binary operation $\circ: G
\times G \to G$ satisfying:
\begin{enumerate}
\item there is an $e \in G$ such that $e \circ g =g\circ e =g$ for
all $g\in G$.

\item  for all $g \in G$, there is an $g^{-1} \in G$ such that
$g\circ g^{-1} = g^{-1}\circ g = e$

\item for all $g_1,g_2,g_3 \in G$, we have $(g_1\circ g_2)\circ
g_3 = g_1\circ( g_2\circ g_3)$.
\end{enumerate}
A group is said to be {\bf abelian} if $x\circ y=y\circ x$ for all
$x,y\in G$.
\end{defn}

For simplicity, we will denote $xy$ for $x \circ y$.\\

A subset $H \subset G$ is a {\bf subgroup} if $H$ is a group by
using the binary operation of $G$, denoted $H< G$.\\

A {\bf group homomorphism} $f : G \to H$ is a function between
groups that respects the structure of groups. That is, a function
satisfying $f(xy) = f(x) f(y)$.\\
The {\bf kernel} of $f$, denote $\ker(f)$, is defined to be $\{ x
\in G | f(x) =e_H\}$.\\

A subgroup $H <G$ is said to be {\bf normal} if $gHg^{-1} =H$ for
all $g \in G$, denoted $H \lhd G$. Given a subgroup $H< G$, we
note $G/H$ the set of left cosets, i.e. $G/H =\{ gH | g \in G\}$.
When $H \lhd G$ is normal, then $G/H$ has induced group structure
given by $ xH \circ yH := xyH$. This is called the quotient group.

We remark that a subgroup is normal if and only if it is the
kernel of some homomorphism. The following lemma is useful

\begin{lem}\label{inkernel}
Let $f: G \to H$ be a group homomorphism. Let $N$ be a normal
subgroup of $G$ contained in $\ker (f)$, then there is an induced
homomorphism $\bar{f}: G/N \to H$.
\end{lem}

\begin{proof}
Define $\bar{f}: G/N \to H$ by $\bar{f}(gN)= f(g)$. Then it's
routine to verify it's well-defined and it's a group homomorphism.
\end{proof}

Regarding group homomorphisms, there are some useful facts:
\begin{thm} [First isomorphism theorem] \label{1isothm}
Let $f: G \to H$ be a group homomorphism, then there is an induced
isomorphism $\bar{f}: G/\ker(f) \cong im(f)$.\\
In particular, if $f$ is surjective, then $\bar{f}: G/ \ker(f)
\cong H$.
\end{thm}
\begin{proof}
Define $\bar{f}: G/\ker(f) \to H$ by $\bar{f}(g\ker(f))= f(g)$.
Then it's routine to verify it's well-defined and it's a injective
group homomorphism.
\end{proof}

\begin{ex}
Let $G$ be the set of all maps $T_{a,b}: \bR \to \bR$ such that
$T_{a,b}(x)=ax+b$ with $a \ne 0$. Then $G$ is a group under
composition. There are two natural subgroups:\\
$A:=\{ T_{a,0} \} \cong \bR^*$, the multiplication group.\\
$N:=\{ T_{1,b} \} \cong \bR$, the translation group.\\
There is a group homomorphism $f: G \to \bR^*$ by $f(T_{a,b})=a$.
Its kernel is $N$, which is a normal subgroup of $G$. So we have $
G/N \cong A$. \\
Moreover, $G=NA=AN$ and $N\cap A = \{e\}$. So in fact $G$ is the
{\bf semidirect product} of $A$ and $N$.
\end{ex}

\begin{thm} [Second isomorphism theorem] \label{2isothm}
Let $H,K$ be subgroups of $G$. Then we have group isomorphism
$$ H/(H \cap K) \cong HK/ K,$$
when\\
1. $H < N_G(K)$ or especially, \\
2. $K \lhd G$.
\end{thm}

\begin{proof}[Sketch]
Recall that $N_G(K):=\{x \in G| xKx^{-1}=K\}$ denotes the
normalizer of $K$ in $G$. It is the maximal subgroup of $G$ in
which $K$ is normal. In particular $K \lhd N_G(K)$. So $K \lhd G$ if and only if $G= N_G(K)$.\\

Also one can check that if $H < N_G(K)$, then $HK=KH < N_G(K)$ is
a subgroup of $G$. Moreover, $K \lhd HK$.\\

On the other hand, if $H < N_G(K)$, then $H \cap K \lhd H$. Thus
both sides are groups. \\

Finally, we consider $f: H \to HK/K$ by $f(h)=hK$. It's easy to
check that $f$ is surjective with kernel $H \cap K$. By first
isomorphism theorem, we proved (1). And (2) is just a special case
of (1).
\end{proof}

Given a surjective homomorphism $f: G \to H$, by First isomorphism
theorem, $H \cong G/N$ where $N=\ker(f)$ is a normal subgroup.
It's natural to study the group structures between them. It's easy
to see that there is a map
$$ \{ K < G/N \} \stackrel{f^{-1}}{\to} \{L < G| N < L\}.$$
In fact, this map is bijective. Moreover, it sends normal
subgroups to normal subgroups.

\begin{thm}[Third isomorphism theorem] \label{3isothm}
Given $N \lhd G$ and $K \lhd G$ containing $N$. Then $K/N \lhd
G/N$. Moreover, $(G/N)/(K/N) \cong G/K$.
\end{thm}

\begin{proof}[Sketch]
It's easy to check that $K/N \lhd G/N$ by definition.\\
In fact, we consider $f:G \to G/K$. Since $N \lhd G $ and $N$ is
contained in $\ker(F) =K$, by Lemma \ref{inkernel}, we have an
induced map $\bar{f}: G/N \to G/K$ which is clearly surjective.
One checks that $\ker(\bar{g})= K/N$ and we are done by Themreom
\ref{1isothm}.
\end{proof}

\subsection{cyclic groups}
\noindent \\ Among all groups, perhaps simplest ones are cyclic
groups. Let $G$ be a group. We say that $G$ is cyclic if there is
an element $x\in G$ such that every element $g \in G$ can be
written as $x^n$ for some $n \in \bZ$.

It's clear that $\bZ$ under addition is a cyclic group. By the
definition, given a cyclic group $G$, there is a surjective map
$f: \bZ \to G$, by $n \mapsto x^n$. This is indeed a group
homomorphism. Therefore, by Theorem \ref{1isothm}, $G \cong \bZ /
\ker(f)$.

The reader should find no difficulty showing that subgroups of
$\bZ$ is either $\{0\}$ or of the form $n \bZ$. Since $\bZ$ is
abelian, every subgroup is normal.

Turning back to the discussion of cyclic groups. There are two
cases:\\
1. $\ker(f)=0$. Then $G \cong \bZ$. This is called an infinite
cyclic group.\\
2. $\ker(f)=n \bZ$. Then $G \cong \bZ / n \bZ$. This is called a
cyclic group of order $n$, denoted  $\bZ_n$.

There list  some properties and leave the proof for the readers.
\begin{prop} Let $G$ be a cyclic group.\\
\noindent 1. Every subgroup is cyclic. \\
2. Homomorphic image of $G$ is cyclic.\\
3. If $G$ is a cyclic group of order $n$, for all $d|n$ there
exist a subgroup of order $d$. \\
4. If $G$ is a cyclic group of order $n$ with a generator $x$,
then the set of generators consist of $\{x^t | (t,n)=1 \}$.
\end{prop}

\vfill
 \pagebreak
\begin{center}
 Sep. 29, 2006 (Fri.)
\end{center}



\subsection{group action}
\noindent \\
Group action is one of the most fundamental concept in group
theory. There are many situations that group actions appear
naturally. The purpose of this section is to develop basic
language of group action and apply this to the study of abstract
groups.

 We will first define the group action and illustrate some
previous known theorem as examples.

\begin{defn}
We say a group $G$ acts on a set $S$, or $S$ is a $G$-set, if
there is function $\alpha: G \times S \to S$, usually denoted
$\alpha(g,x)=gx$, compatible with group structure, i.e.
satisfying:
\begin{enumerate}
\item let $e \in G$ be the idetity, then $ex=x$  for all $x\in S$.
\item $g(hx)=(gh)x$ for all $g,h \in G$, $x\in S$.
\end{enumerate}
\end{defn}


By the definition, it's clear to see that if $y=gx$, then
$x=g^{-1}y$. Because $ x=ex=(g^{-1}g)x=g^{-1}(gx)=g^{-1}y$.

Moreover, one can see that given a group action $\alpha: G \times
S \to S$ is equivalent to have a group homomorphism
$\tilde{\alpha}: G \to A(S)$, where $A(S)$ denote the group of
bijections on $S$.

\begin{exer}
There is a bijection between $\{ \text{group action of } G \text{
on } S \}$ with $\{ \text{group homomorphism } G \to A(S)\}$.
\end{exer}

\begin{ex} [Cayley's Theorem]\end{ex}
Let $G$ be a finite group of $|G|=n$. Then there is an injective
homomorphism $G \to S_n$.\\

To see this, we consider $G$ acts on $G$ via the group operation,
i.e. $G \times G \to G$. Thus we have a homomorphism $\varphi: G
\to
A(G)$.\\

It's clear that $A(G) = S_n$. It's easy to see that $\varphi$ is
injective. \qed

This give an example of "permutation representation". That is,
represent a group into permutation groups. We gave another
example:

\begin{ex}
\end{ex}
Let $\bF_2$ be the field of 2 elements. We would like to see that
$GL(2, \bF_2) \cong S_3$.

We consider $V$ the $2$ dimensional vector space over $\bF_2$.
There are $3$ non-zero vector in $V$, denoted, $W:=\{v_1:=e_1,
v_2:=e_2, v_3:=e_1+e_2\}$. It's clear that $GL(2, \bF_2)$ acts on
$W$. Thus we have a representation $GL(2, \bF_2) \to A(W) \cong
S_3$. One can check that this is indeed an isomorphism. \qed

We now introduce two important notions:
\begin{defn}
Suppose $G$ acts on $S$. For $x\in S$, the {\bf orbit} of $x$ is
defined as $$\OO_x:=\{ gx| g \in G\}.$$ And the {\bf stabilizer}
of $x$ is defined as $$ G_x:=\{ g \in G | gx=x \}.$$
\end{defn}

It's immediate to check the following:\\
\begin{lem} Given a group $G$ acting on $S$. For $x,y \in S$, we
have:
1. $G_x < G$.\\
2. either $\OO_x = \OO_y$ or $\OO_x \cap \OO_y = \emptyset$.\\
3. if $y= gx$, then $G_y = g G_x g^{-1}$.
\end{lem}

\begin{prop}
$$ |G|= |\OO_x| \cdot |G_x|.$$
\end{prop}
\begin{proof}[Sketch]
For given $y \in \OO_x$, we consider $S_y:=\{ g \in G| gx=y\}$.
Then $$G = \cup_{y \in \OO_x} S_y, $$ which is a disjoint union.

Furthermore, for each $y \in \OO_x$, we can write  $y=gx$.   Then
one has $S_y= g G_x$. In particular $|S_y|= | G_x|$. We fix a
$g_y$ such that $y=g_y x$ once and for all. We may define a
bijection $ G \to \OO_x \times G_x$ as sets by $g \mapsto (gx,
g(g_{gx})^{-1})$. Thus
$$|G|=|\OO_x| \cdot |G_x|.$$
\end{proof}

\begin{cor} [Lagrange's Theorem]
Let $H< G$ be a subgroup. Then $|G| = |G/H| \cdot |H|$.
\end{cor}

\begin{proof}
We take $S=G/H$ with the action $G \times G/H \to G/H$ via
$\alpha(g,xH)=gxH$. For $ H \in S$, the stabilizer is $H$, and the
orbit is $G/H$. Thus we have $$|G| = |G/H| \cdot |H|,$$ which is
the Lagrange's theorem.
\end{proof}

Another way of counting is to consider the decomposition of $S$
into disjoint union of orbits. Note that if $\OO_x=\OO_y$ if and
only if $y \in \OO_x$. Thus for convenience, we pick a
representative in each orbit and let $I$ be a set of
representatives of orbits. We have a disjoint union:
$$ S= \cup_{x\in I} \OO_x.$$
In particular, $$ |S| = \sum_{x \in I} |\OO_x|.$$

This simple minded equation actually give various nice
application. We have the following natural applications.

\begin{ex}[translation] \end{ex}
Let $G$ be a group. One can consider the action $G \times G \to G$
by $ \alpha(g,x)=gx$. Such action is called translation. More
generally, let $H < G$ be a subgroup. Then one has translation $ H
\times G \to G$ by $(h,x) \mapsto hx$. In this setting, $\OO_x =
Hx$. And the set  of orbits is $G/H$, the right cosets of $H$ in
$G$.  Then $$|S| = \sum_{x \in I} |\OO_x|= |G/H| \cdot |H|$$ gives
Lagrange theorem again. \qed



\begin{ex}[conjugation]\end{ex}
Let $G$ be a group. One can consider the action $G \times G \to G$
by $ \alpha(g,x)=gxg^{-1}$. Such action is called conjugation. For
a $x \in G$, $G_x=C(x)$, the centralizer of $x$ in $G$. And
$\OO_x= \{ gxg^{-1} | g \in G \}$ the conjugacy classes of $x$ in
$G$. So in general, we have
$$ |G| = \sum_{\text{conj. classes}} |C|,$$
which is the {\bf class equation}.

 Now assume that  $G$ is finite. The class equation now reads:
$$ |G|= \sum_{x \in I} |G|/|C(x)|,$$ where $I$ denotes a
representative of conjugacy classes.

And $\OO_x =\{ x\}$ if and only if $x \in Z(G)$, the center of
$G$. So, for $G$ finite, the class equation now gives
$$ |G|=|Z(G)|+ \sum_{x \in I, x \not \in Z(G)} |G|/|C(x)|.$$ Which  is the usual form of class equation.
\qed

The class equation  is very useful if the group is a finite
$p$-group. We recall some definition

\begin{defn}
If $p$ is a prime, then a {\bf $p$-group} is a group in which
every element has order a power of $p$.\\
By a finite $p$-group, we mean a group $G$ with $|G|=p^n$ for some
$n
>0$.
\end{defn}
Consider now $G$ is a finite $p$ group acting on $S$. Let
$$ S_0:=\{ x \in S | gx=x, \forall g \in G \}.$$
Then  the class equation can be written as $$ |S|=|S_0|+\sum_{x
\in I, x \not \in S_0} |\OO_x|.$$ One has the following

\begin{lem}\label{modp}
Let $G$ be a finite $p$-group. Keep the notation as above, then
$$|S| \equiv |S_0| \quad (\text{mod }p).$$
\end{lem}

\begin{proof}
If $x \not \in S_0$, then $ 1 \ne |\OO_x| =p^k$ because
$|G|=|\OO_x| \cdot |G_x|$.
\end{proof}

By consider the conjugation $G \times G \to G$, one sees that
\begin{cor}
If $G$ is a finite $p$-group, then $G$ has non-trivial center.
\end{cor}

By using the similar technique, one can also prove the important
Cauchy's theorem

\begin{thm} [Cauchy]
Let $G$ be a finite group such that $p \mid |G|$. Then there is an
element in $G$ of order $p$.
\end{thm}

\begin{proof}[sketch]
We keep the notation as in Lemma \ref{modp}. Let $$S:=\{
(a_1,...,a_p)| a_i \in G, \prod a_i =e\}.$$ And consider a group
action $\bZ_p \times S \to S$ by $ (1,(a_1,..,a_p)) \mapsto
(a_p,a_1,...,a_{p-1})$. One claims that $S_0=\{ (a,a,...,a)| a \in
G, a^p=e\}$.

By the Lemma, one has $|S| \equiv |S_0| \quad (\text{mod } p )$.
It follows that $p \mid |S_0|$. In particular, $|S_0| >1$, hence
there is $(a,...,a) \in S_0$ with $a \ne e$. One sees that
$o(a)=p$.
\end{proof}

\begin{cor}
A finite group $G$ is a $p$-group if and only it is a  finite
$p$-group.
\end{cor}

\subsection{Sylow's theorems}

\noindent We are now ready to prove Sylow theorems. The first
theorem regards the existence of $p$-subgroups in a given group.
The second theorem deals with relation between $p$-subgroups. In
particular, all Sylow $p$-subgroups are conjugate. The third
theorem counts the number of Sylow $p$-subgroups.

\begin{thm}[First Sylow theorem]
Let $G$ be a finite group of order $p^n m$ (where $(p,m)=1$). Then
there are subgroups of order $p^i$ for all $ 0 \le i \le n$.

Furthermore, for each subgroup $H_i$ of order $p^i$, there is a
subgroup  $H_{i+1}$ of order $p^{i+1}$ such that $H_i \lhd
H_{i+1}$ for $ 0 \le i \le n-1$.
\end{thm}

In particular, there exists a subgroup of order $p^n$, which is
maximal possible, called Sylow $p$-subgroup. We recall the useful
lemma which will be used frequently.
\begin{lem}
Let $G$ be a finite $p$-group. Then
$$|S| \equiv |S_0| \quad (\text{mod }p).$$
\end{lem}

\begin{proof}[proof of the theorem]
We will find subgroup of order $p^i$ inductively. By Cauchy's
theorem, there is a subgroup of order $p$. Suppose that $H$ is a
subgroup of order $p^i$. Consider the group action that $ H$ acts
on $S=G/H$ by translation, i.e. $H \times G/H \to G/H$ by $h(xH):=
hxH$. One shows that $xH \in S_0$ if and only if $xH=hxH$ for all
$h \in H$ if and only if $ x \in N_G(H)$. Thus $|S_0|=|N_G(H)/H|$.

If $i < n$, then
$$ |S_0| \cong |S|=p^{n-i}m \equiv 0 \quad (\text{mod } p).$$ By Cauchy's
theorem, the group $N_G(H)/H$ contains a subgroup  of order $p$.
The subgroup is of the form $H_1/H$, hence $|H_1|=p^{i+1}$.
Moreover, $H \lhd H_1$.
\end{proof}

\begin{ex}
If $G$ is a finite $p$-group of order $p^n$, then one has a series
of subgroups $\{e \} =H_0 < H_1 <...< H_n=G$ such that $|H_i|=p^i$
and $H_i \lhd H_{i+1}, H_{i+1}/H_i \cong \ZZ_p$. In particular,
$G$ is solvable.
\end{ex}

\begin{defn}
A subgroup $P$ of $G$ is a Sylow $p$-subgroup if $P$ is a maximal
$p$-subgroup of $G$.
\end{defn}

If $G$ is finite of order $p^n m$ then a subgroup $P$ is a Sylow
$p$-subgroup if and only if $|P|=p^n$ by the proof of the first
theorem.

\begin{thm}[Second Sylow theorem]
Let $G$ be a finite group of order $p^n m$. If $H$ is a
$p$-subgroup of   $G$, and $P$ is any Sylow $p$-subgroup of $G$,
then there exists  $x \in G$ such that $xHx^{-1} < P$.
\end{thm}

\begin{proof}
Let $S=G/P$ be the set of left cosets and $H$ acts on $S$ by
translation. Thus by  Lemma \ref{modp}, one has $|S_0| \equiv
|S|=m (\text{mod } p)$. Therefore, $S_0 \ne \emptyset$. One has
$$xP \in S_0 \Leftrightarrow hxP=xP \quad \forall h \in H
\Leftrightarrow x^{-1}Hx < P.$$ This completes the proof.
\end{proof}

An immedaitely but important consequence is that any two Sylow
$p$-subgroups are conjugate.

\begin{thm}[Third Sylow theorem]
Let $G$ be a finite group of order $p^n m$. The number of Sylow
$p$-subgroups divides $|G|$  and is of the form $kp+1$.
\end{thm}

\begin{proof}
Let $S$ be the conjugate class of a Sylow $p$-subgroup $P$ (this
is the same as the set of all Sylow $p$-subgroups). We consider
the action that $G$ acts on $S$ by conjugation, then the action is
transitive, i.e. for any $x,y \in S$, there exists $g \in G$ such
that $y=gx$. In particular $\OO_x=S$.  Hence $|S| \mid |G|$ for
$|G|=|G_x| \cdot |\OO_x|$.

Furthermore,  we consider the action $P \times S \to S$ by
conjugation. Then $$Q \in S_0 \Leftrightarrow xQx^{-1}=Q \quad
\forall x \in P \Leftrightarrow P < N_G(Q).$$ Both $P,Q$ are Sylow
$p$-subgroup of $N_G(Q)$ and therefore conjugate in $N_G(Q)$.
However, $Q \lhd N_G(Q)$, $Q$ has no conjugate other than itself.
Thus one concludes that $P=Q$. In particular, $S_0=\{P\}$. By
Lemma \ref{modp}, one has $|S|=1+kp$.
\end{proof}

\begin{ex}\end{ex}
Group of order $200$ must have normal Sylow subgroups. Hence it's
not simple.  To see this, let $r_p:=$ number of Sylow
$p$-subgroups. Then $r_5=1$. So if $P$ is a Sylow $5$-subgroup.
Since $gPg^{-1}$ is also a Sylow subgroup, it follows that
$gPg^{-1} = P$ for all $g \in G$. Thus $P \lhd G$. \qed

\begin{ex} \end{ex}
There is no simple group of order $36$. To see this, we consider
$P$ a Sylow $3$-subgroup. Then $r_3=1$ or $4$. In case that
$r_3=4$, let $S$ be the set of Sylow $3$-subgroups. We have a
group action $G \times S \to S $ by conjugation. Thus we have a
group homomorphism $\varphi: G \to A(S) \cong S_4$. Comparing the
cardinality of groups, one sees that $\varphi$ must have
non-trivial kernel. Hence $G$ is not simple. \qed

\subsection{groups of small order}
We can use the technique developed in the previous sections to
study group of small order in more detail.

First of all, as a direct consequence of Cauchy's theorem,

\begin{prop} Let $p$ be a prime.
A group of order $p$ is cyclic.
\end{prop}

\begin{ex} \end{ex}
Classify groups of order $2p$.

 If $p=2$, then this is well-known.
So we may assume that $p
>2$. \\
First of all there is a subgroup $H<G$ of order $p$, generated by
$x$,  by Cauchy's theorem. By Sylow's third theorem, we have
$r_p=1$, hence $H$ is normal. Similarly, there is an element of
order $2$, say $y$. By normality of $H$, we have $yxy^{-1}= x^k$
for some $k$. Since $$x=y^{2}x y^{-2} = y x^k y^{-1} = x^{k^2},$$
it follows that $k^2 \equiv 1 (\mod p)$. Hence $k \equiv 1$ or
$\equiv -1$. \\
\noindent
 {\bf Case 1.} $k \equiv 1$, then $xy=yx$. It follows
that $G$ is
abelian. By chinese Remainder Theorem, $G$ is cyclic. \\
{\bf Case 2.} $ k \equiv -1$, then $xy=yx^{-1}$. These kind of
group is called {\bf dihedral groups}, denoted $D_{2p}$. \qed


\begin{ex} \end{ex} Let $p,q $ be primes.
If $|G|=pq$, then its structure can be determined similarly.\\
We assume that $p >q$. Then there are $x,y \in G$ of order $p,q$
respectively. Moreover, $H:=<x> \lhd G$.  We have $yxy^{-1}= x^k$
for some $k$. Since $$x=y^{q}x y^{-q} = y x^k y^{-1} = x^{k^q},$$
it follows that $k^q \equiv 1 (\mod p)$.
Now the situation depends on the structure of $\bZ_p^*$. Recall that $\bZ_p^* \cong \bZ_{p-1}$ is cyclic.\\
\noindent
 {\bf Case 1.} $q  \nmid p-1$, then $k^q \equiv 1 (\mod p)$
 implies that $k \equiv 1$. Hence
 $xy=yx$. It follows
that $G$ is
abelian. By chinese Remainder Theorem, $G$ is cyclic. \\
{\bf Case 2.} $ q  \mid p-1$, then $k^q \equiv 1 (\mod p)$ has $q$
solutions, $k \equiv a,a^2,...,a^{q-1}, a^q \equiv 1 $. If we pick
$k \equiv a$, then we determined a group $G_1$ which is generated
by $x_1,y_1$ with $y_1x_1y_1^{-1}=x_1^a$. If we pick $k \equiv
a^2$, then we determined a group $G_2$ which is generated by
$x_2,y_2$ with $y_2x_2y_2^{-1}=x_2^{a^2}$. Note that the map
$\varphi: G_2 \to G_1$ by $\varphi(y_2)=y_1^2, \varphi(x_2)=x_1$
gives an isomorphism. Therefore, for different solution $k \equiv
a,a^2,...,a^{q-1}$, they determined the same group.
 \qed

There is a useful construction to produce groups from simple ones
called {\bf semi-direct product} which we now introduce. Given two
groups $G,H$ and a homomorphism $\theta: H \to \Aut(G)$. Let $G
\times_\theta H$ be the set $G \times H$ with the binary operation
$(g,h) (g',h') =( g (\theta(h)(g')), hh')$. One can verify that
this produce a group.

For example, in the case 2 of above example, we have $G= \bZ_p,
H=\bZ_q$ and we consider $\theta: \bZ_q \to \Aut(\bZ_p) \cong
\bZ_p^*$ by $\theta(1) =a$. Then we obtained $\bZ_p \times_\theta
\bZ_q$. Such group is called a {\bf metacyclic groups}.

\begin{prop}
Let $p$ be a primes. If $|G|=p^2$, then $G$ is abelian.
\end{prop}

We will discuss the structure of finite ableina groups later. In
principle, their structure are pretty easy.

\begin{proof}[sketch]
By class equation,  one sees that  $Z(G)$ is non-trivial.\\
\noindent {\bf Case 1.} if $|Z(G)|=p^2$, then $G$ is abelian.\\
{\bf Case 2.} if $|Z(G)|=p$, then $G/Z(G)$ is a group of order $p$
, hence cyclic. We pick $ x \in G$ such that $G/Z(G)$ is generated
by $x Z(G)$. We also pick $y \in G$ such that $Z(G)$ is generated
by $y$. It's easy to check that $G$ is generated by $x,y$. Note
that $xy=yx$, it follows that $G$ is abelian.
\end{proof}

Using above properties, one can classified groups of order $ \le
15$ completely unless for order $8$ and $12$. In fact groups of
order $8$ are either abelian or $D_8$ or $Q_8$. Where $Q_8$ is the
quaterion group defined by $\{i,j,k,-i,-j,-k,1,-1 |
i^2=j^2=k^2=-1, ijk=-1\}$.

Easy example of non-abelian groups of order $12$ includes $A_4,
D_{12}$. In fact there is one more, $T=<a,b | a^6=b^4=1,
b^2=a^3=(ab)^2 >$.

\begin{thm}
every non-abelian group $G$ of order $12$ is isomorphic to $A_4,
D_{12}$ or $T$.
\end{thm}

\begin{proof}[sketch]
Let $P$ be a Sylow $3$-subgroup. We first consider the action $G
\times G/P \to G/P$ by translation. It gives rise to a
homomorphism $\varphi: G \to A(G/P) \cong S_4$. It's clear that
$\ker(\varphi) < P$.\\
\noindent {\bf Case 1.} $\ker(\varphi) = \{e\}$, then $G \cong
A_4$. \\
{\bf Case 2.} $\ker(\varphi)=P$. Then we need to wok harder. So
now, $P \lhd G$ and $P$ is the unique Sylow $3$-subgroup. Let
$P=\{x,x^2,x^3=e\}$, then $x,x^2$ are the only element in $G$ of
order $3$.

Let $K$
be a Sylow $2$-subgroup, then $K$ is either $V_4$ or $\bZ_4$. \\
{\bf Case 2.i.} If $K \cong V_4$, by computing the relation
between
generators, one can show that $G \cong D_{12}$.\\
{\bf Case 2.ii.} If $K \cong \bZ_4$, by computing the relation
between
generators, one can show that $G \cong T$.\\
\end{proof}

Groups of order $p^n$, $n \ge 3$ could be very complicated. Here
just give two more examples.

\begin{ex} \label{quaterion} \end{ex}
Let $G < GL(2,\bC)$ be the group generated by $A= \left(
\begin{array}{cc} 0 & \omega \\ \omega & 0 \end{array} \right)$ and
$B=\left( \begin{array}{cc} 0 & 1 \\ -1 & 0 \end{array} \right)$,
where $\omega$ is a primitive $2^{n-1}$th root of unity for $n \ge
3$. Then $G$ is a group of order $2^n$. \qed

\begin{ex} \end{ex}
Let $G < GL(3,\bC)$ be the group generated by $A= \left(
\begin{array}{ccc} 1 & 0 & 0 \\ 0 & \omega & 0 \\ 0 & 0 & \omega^2  \end{array} \right)$ and
$B=\left( \begin{array}{ccc} 0 & 1 & 0 \\ 0 & 0 & 1\\ 1 & 0 & 0
\end{array} \right)$, where $\omega$ is a primitive $3$th
root of unity. Then $G$ is a group of order $27$. \qed

\vfill
 \pagebreak
\begin{center}
 Oct. 13, 2006 (Fri.)
\end{center}

\subsection{symmetry of the plane}
A map from plane itself is called a {\bf rigid motion}, or an {\bf
isometry}, if it is distance-preserving. Let $S$ be a subset of
the plane. Then the subgroups of rigid motions preserving $S$ is
called the {\bf symmetry of $S$}. It's well-known that:

\begin{ex} \end{ex}
Let $S$ be the regular $n$-gon centered at the origin. Then the
symmetry of $S$ id the group $D_{2n}$. \qed

In order to build this is a more solid foundation, we need to work
a little bit more.

A list of rigid motions consists of:\\
 \noindent 1. Orientation-preserving motions:\\
 \noindent a. Translation.\\
 \noindent b. Rotation.\\
 \noindent 2. Orientation-reversing motions:\\
 \noindent a. Reflection.\\
 \noindent b. Glide reflection, i.e. reflecting about a line $l$
 and then translating by a non-zero vector $a$ parallel to $l$.

 \begin{thm}
The above list is complete.
 \end{thm}

 \begin{proof}[Sketch]
 We first fix some notations:\\
 $t_a$: translation by a vector $a$.\\
 $\rho_\theta$: rotation by an angle $\theta$ about the origin.\\
 $r$: reflection about the $x$-axis.\\

\noindent
 {\bf Step 1.} Orientation preserving motions that fix the origin
 are $\{\rho_\theta\}$.

\noindent
 {\bf Step 2.} Let $m$ ne an orientation preserving motion. If
 $m(o)= a$, then $ t_{-a} m = \rho_\theta$ for some $\theta$. by Step 1.
 Thus $m = t_a \rho_\theta$.

\noindent
 {\bf Step 3.} If $m$ is not a translation, i.e. $\theta \ne 0$,
 then $m$ is a rotation about a point $p$. To see this, first show
 that $m$ has a fixed point, denoted $p$, if $\theta \ne 0$.
A point on the plane can be written as $p+x$, $$m(p+x) = t_a
\rho_\theta ( p+x) =\rho_\theta ( p+x) +a = \rho_\theta ( p)
+\rho_\theta ( x) +a = p+ \rho_\theta ( x).$$

\noindent {\bf Step 4.} Orientation reversing motions that fix the
origin
 are $\{\rho_\theta  r\}$. For given such $m$, it's clear that $r
 m $ preserves the orientation and fixes the origin. So $r m =
 \rho_\theta$ for some $\theta$. Thus  $m = r \rho_\theta = \rho_{- \theta} r $.
 Also note that $ \rho_\theta r$ is the reflection about $l$,
 denoted $r_l$,
 which is the line obtained by rotating $x$-axis by $\frac{1}{2}
 \theta$.

 \noindent {\bf Step 5.} Let $m$ be an  orientation reversing
 motion. Then $m(o) =a $ for some $a$. Thus $t_{-a} m$ is an  orientation reversing
 motion that fixes origin, hence $t_{-a} m = r_l$. Therefore, $m =
 t_a r_l$ which is a glide reflection.
\end{proof}

Indeed, let $O(2, \bR)$ be the subgroup of motions that fix the
origin. Then $O(2,\bR)$ is generated by $\{ \rho_\theta, r \}$.
Let $M$ be the groups of plane rigid motions, then there is a
 group action $M \times \bR^2 \to \bR^2$. The orbit of $o$ is the
 whole $\bR^2$ and the stabilizer of $o$ is $O(2,\bR)$.

For readers who want to know more about symmetry, we refer
[Artin], Chapter 5.

\subsection{abelian groups}
In this section, we are going to study a simple but important
category of groups, the abelian groups.

Given an abelian group $G$, we usually use $+$ to denote the
operation. We say that $G$ can be generated by $X \subset G$,
denoted $G= <X>$, if every element of $G$ can be written as $\sum
n_i x_i$ for some $n_i \in \bZ$ and $x_i \in X$. Note that $n_i
\ne 0$ for all but finitely many $i$.

A {\bf basis} of an abelian group $G$ is a {\it linearly
independent} generating subset $X$. That is for distinct
$x_1,...,x_k \in X$, $ \sum n_i x_i =0 $ implies that $n_i$ for
all $i$.

An abelian group with a basis is called a {\bf free abelian
group}. And the rank, denoted $rk(F)$, is $|X|$.

It's easy to prove that an abelian group is free if and only if
it's a direct sum of $\bZ$.

On the other hand, given a set $X$, we can always construct a free
abelian group on the set $X$ by consider the set
$$F:=\{ \sum n_x x | x \in X, n_x \in \bZ, n_x = 0 \text{ for all
but finitely many } x \}.$$ The group operation on $F$ is nothing
but $\sum n_x x + \sum m_x x := \sum (n_x+m_x) x$. It's clear that
$X$ is a basis of $F$ in this construction.

\begin{ex} \end{ex}
This construction appeared, for example, in algebraic topology.
The groups of $1$-chains is the free abelian group on the set of
simplicial  $1$-chains. \qed

\begin{ex} \end{ex}
Let $X$ be a Riemann surface, then the group of divisors,
$Div(X)$, is the free abelian group on the set $X$. \qed

It has the following universal property:
\begin{prop}
Let $F$ be a free abelian group with basis $X$. For any function
$f: X \to G$ to an abelian group $G$. There exist a unique
homomorphism $\varphi: F \to G$ extending $f$.
\end{prop}

\begin{proof}
Let $\varphi ( \sum n_x x ) = \sum n_x f(x)$, then verify it.
\end{proof}

\begin{cor}
Every abelian group is a quotient of a free abelian group.
\end{cor}

\begin{proof}
Let$G$ be an abelian group. Let $F$ be the free abelian group on
the set $G$. Consider $f:G \to G$ the identity map. Then we are
done.
\end{proof}

\begin{ex} \end{ex}
$\bQ$ can be describe as following. Let $X= \{ x_1,...,x_n,...\}$
and $F$ the free abelian group on the set $X$. Take $f: X \to \bQ$
by $f(x_i)=\frac{1}{i}$. Then $\bQ$ is a quotient of $F$. \qed

We are now   ready to state develop to main theorem of this
section.  We need the following:

\begin{lem}
If $\{ x_1,...,x_n\}$ is a basis of $F$, then $\{x_1,...,x_{j-1},
x_j+a x_i, x_{j+1},...,x_n\}$ is also a basis of $F$ for $i \ne j$
and $a \in \bZ$.
\end{lem}

\begin{thm}\label{abgp}
Let $F$ be a free abelian group of rank $n$ and $G$ is a non-zero
subgroup of $F$, then there exists a basis $\{x_1,....,x_n\}$ of
$F$, an integer $r$ $(1 \le r \le n)$ and positive integer
$d_1,...,d_r$ such that $d_1|d_2|...|d_r$ and $G$ is free abelian
group with basis $\{d_1x_1,...,d_rx_r\}$.
\end{thm}

\begin{proof}[Sketch]
If $n=1$, this is easy.

By induction, we assume that the theorem is true for all abelian
groups of rank $\le n-1$. Let
$$ S:= \{ s \in \bZ | sy_1+...k_ny_n \in G, \text{ for some basis
of $F$ }, y_1,...,y_n\}.$$

Let $d_1$ be the smallest positive integer in $S$. By changing
basis, we may have $\{x_1, y_2,...,y_n\}$ basis of $F$ and $d_1x_1
\in G$.

Let $H=<y_2,...,y_n>$. It's clear that $F = H \oplus \bZ x_1$. We
claim that $G= (H \cap G) \oplus \bZ d_1 x_1$.

Apply induction hypothesis to $G\cap H < H$, then we are done.
\end{proof}

\begin{cor}[fundamental theorem of finitely generated abelian
groups]\label{ftab} Let $G$ be a finitely generated abelian group.
Then there exist an integer $r$ and positive integers
$d_1|d_2|...|d_t$ such that $$G \cong \bZ_{d_1} \oplus...\oplus
\bZ_{d_t} \oplus \bZ^r.$$
\end{cor}

\begin{proof}
Let $X$ be a finite generating set  of $G$. And let $F$ be the
free abelian group on the set $X$.  Then there is a surjective
homomorphism $F \to G$. Apply Theorem \ref{abgp} to $ \ker < F$.
\end{proof}

Now we restrict ourselves to finite abelian groups. Let $G$ be a
finite abelian group, by Corollary \ref{ftab},
$$G \cong \bZ_{d_1} \oplus ...\oplus \bZ_{d_t}.$$
These $d_1,...,d_t$ are called {\bf invariant factors}. We
consider the factorization of $d_i$ into prime factors, then we
have for all $i$, $$d_i = p_1^{a_{i,1}}...p_k^{a_{i,k}}.$$ By
Chinese Remainder Theorem, we have for all $i$,
$$ \bZ_{d_i} \cong \bZ_{p_1^{a_{i,1}}} \oplus ... \oplus
\bZ_{p_k^{a_{i,k}}}.$$ Therefore,
$$ G \cong \oplus_{j=1}^{k} ( \oplus_{i=1}^{t}
\bZ_{p_j^{a_{i,j}}}).$$ It's clear that $\oplus_{i=1}^{t}
\bZ_{p_j^{a_{i,j}}}$ is the Sylow $p_j$-subgroup. And these
$p_j^{a_{i,j}}$ are called {\bf elementary divisors}.

\begin{ex} \end{ex}
Let $G= \bZ_{100} \oplus \bZ_{40}$. By Chinese Remainder Theorem,
$\bZ_{100} \cong \bZ_{4} \oplus \bZ_{25}$ and $\bZ_{40} \cong
\bZ_{8} \oplus \bZ_5$. Thus
$$ G \cong \bZ_{4} \oplus \bZ_{8} \oplus  \bZ_5 \oplus
\bZ_{25} \cong  \bZ_{20} \oplus \bZ_{200}.$$ So invariant factors
are $20, 200$ and elementary divisors are $4,8,5,25$. \qed

\begin{ex} \end{ex}
Let $G = \bZ_m \oplus \bZ_n$. Then invariant factors are
$(m,n),[m,n]$, the gcd and lcm of $m,n$. \qed


\vfill
 \pagebreak
\begin{center}
 Oct. 20, 2006 (Fri.)
\end{center}

Let $G$ be an abelian group, there there is a natural important
homomorphism $ m : G \to G $ by $m(x):=mx$ for $m \in \bN$. The
image is denoted $mG$ and kernel is denoted $G[m]$. Let $G(p) = \{
u \in G| o(u)=p^n \text{ for some } n \ge 0\}$.  One can show that
$G(p)$ is the Sylow $p$-subgroup of $G$. And $G$ is a direct sum
of Sylow subgroups. Thus it remains to study finite abelian
$p$-groups. The only non-trivial part of classical theory is
showing that a finite abelian $p$-group is a direct sum of cyclic
$p$-groups.

We also remark that for a given finitely generated abelian group
$G$, the rank, invariant factors, and elementary divisors are
unique. To see this, we proceed as following steps:\\
\noindent 1. if $\bZ^n \cong \bZ^m$, then $n=m$.\\
To see this, let $G \cong \bZ^n \cong \bZ^m$. We consider $G/2G
\cong \bZ_2^n \cong \bZ_2^m$. Thus $n=m$.

\noindent 2. let $G_{tor}:=\{ u \in G | m u =0 \text{ for some } m
\}$. It's clear that $G_{tor} < G$.


\noindent 3. If
$$G_1  = \bZ_{d_1} \oplus...\oplus
\bZ_{d_t} \oplus \bZ^r,$$
$$\cong G_2=\bZ_{d'_1} \oplus...\oplus
\bZ_{d'_{t'}} \oplus \bZ^{r'}$$ Then clearly, $ {G_1}_{tor} \cong
{G_2}_{tor}$ and also $G_1/ {G_1}_{tor}=\bZ^r \cong G_2
/{G_2}_{tor}=\bZ^{r'}$. Hence in particular $r=r'$.



\noindent 4. It remains to show that $t=t'$ and $d_i=d'_i$. \\
To see this, it's equivalent to show the uniqueness of elementary
divisors of finite abelian groups. So now we assume that $G$ is
finite abelian group. Also note that if $G_1 \cong G_2$, then
$G_1(p) \cong G_2(p)$. Thus we may even assume that $G$ is a
finite abelian $p$-group.

Suppose now that
$$ G_1:= \bZ_{p^{a_1}} \oplus ... \oplus \bZ_{p^{a_t}}$$
$$ \cong G_2:= \bZ_{p^{b_1}} \oplus ... \oplus \bZ_{p^{b_s}},$$
with $a_1  \le a_2 \le ... \le a_t, b_1  \le b_2 \le ...\le b_s$.

Then we have $pG_1 \cong p G_2$ and $G_1/ p G_1 \cong G_2 /pG_2$.
Note that $G_1/ pG_1 \cong \bZ_p^{c_1}$, with $c_1=\{ i | a_i > 1
\}$. It follows that $c_1(G_1) = c_1 (G_2)$. Similarly, we can
define $c_k:=\{ i | a_i > k \}$ and $c_k(G_1) = c_k(G_2)$.

Moreover, $G_1[p]  \cong \bZ_p^t \cong G_2[p] \cong \bZ_p^s$.
Hence $t=s$.

Since $t, c_1(G_1),c_2(G_1)...$ determine $a_1,...,a_t$ uniquely
and $s, c_1(G_2),c_2(G_2)...$ determine $b_1,...,b_s$ uniquely. It
follows that $t=s$ and $a_i=b_i$ for all $i$.

\vfill \pagebreak

\subsection{Nilpotent groups, solvable groups}


 \noindent
 Given a group $G$, if $G$ has a normal subgroup $N$,
then we have a quotient group $G/N$. One can expect that knowing
$N$ and $G/N$ would give some information on $G$. In this section,
we are going to introduce the general technique of this idea.

Let $G$ be a group. If $G$ has no non-trivial normal subgroup,
then $G$ is said to be {\bf simple}.

In general, there are two natural way to produce normal subgroups.
The first one is the  the center $Z(G)$. It is a normal subgroup
of $G$. And we have the canonical projection $G \to G/Z(G)$. Let
$C_2(G)$ be the inverse image of $Z( G/Z(G))$ in $G$. By the
correspondence theorem, $Z(G/Z(G))$ is a normal subgroup of
$G/Z(G)$ hence $C_2(G)$ is a normal subgroup of $G$. And then let
$C_3(G)$ to be the inverse image of $Z(G/C_2(G))$. By doing this
inductively, one has an ascending chain of normal subgroups
$$\{e\} < C_1(G):=Z(G) < C_2(G) <...$$
Notice that by the construction, each $C_i(G) \lhd G$ and
$C_{i+1}(G)/ C_i(G)$ is abelian.

\begin{defn}
$G$ is nilpotent if $C_n(G)=G$ for some $n$.
\end{defn}

\begin{prop}
A finite $p$-group is nilpotent.
\end{prop}

\begin{proof}
We use the fact that a finite $p$-group has non-trivial center.
Thus one has $C_i \lneqq C_{i+1}$. The group $G$ has finite order
thus the ascending chain must terminates, say at $C_n$. If $C_n
\ne G$, then $G/C_n$ has non-trivial center. One has $C_n \lneqq
C_{n+1}$ which is impossible. Hence $C_n=G$.
\end{proof}

\begin{thm}
If $H,K$ are nilpotent, so is $H \times K$.
\end{thm}

\begin{proof}
The key observation is that $Z(H \times K) = Z(H) \times Z(K)$.
Then inductively, one proves that $C_i(H \times K) = C_i(H) \times
C_i (K)$. If $C_n(H)=H, C_m(K)=K$ then $C_l (H \times K)$ for
$l=max(m,n)$.
\end{proof}

\begin{lem}
Let $G$ be a nilpotent group and $H \lneq G$ be a proper subgroup.
Then $H \lneq N_G(H)$.
\end{lem}

\begin{proof} Let $C_0(G)=\{e\}$.
Let $k$ be the largest index such that $C_k(G) <H$. Then
$C_{k+1}(G) \not < H$. Pick $a \in C_{k+1} -H$, then for every $h
\in H$, we have $C_k ha = C_k h C_k a = C_k a C_k h= C_k ah$ for $
C_{k+1}/C_k = Z ( G / C_k(G))$. Thus $aha^{-1} \in C_k h \subset
H$ for all $h \in H$. That is $a \in N_G(H) -H$.
\end{proof}
Then we are ready to prove the following:

\begin{thm}
A finite group is nilpotent if and only if it's a direct product
of Sylow $p$-subgroups.
\end{thm}

\begin{proof}
By the previous two results, it's clear that a direct product of
Sylow $p$-subgroups is nilpotent.

Conversely, if $G$ is nilpotent, then we will prove that every
Sylow $p$-subgroup is a normal subgroup of $G$. By checking the
decomposition criterion, one has the required decomposition.

It remains to show that if $P$ is Sylow $p$-subgroup, then $P \lhd G$. \\
To this end, it suffices to prove that $N_G(P)=G$. By applying
this Claim to $N_G(P)$, then it says that $N_G(P)$ can't be a
proper subgroup of $G$ since $N_G( N_G(P))=N_G(P)$. Thus it
follows that $N_G(P)=G$.
\end{proof}

\begin{ex} \end{ex}
Let $G= D_{12}=\{x^iy^j| x^6=y^2=e, xy=yx^5\}$. One of it's Sylow
$2$-subgroup is $\{e, x^3, y, x^3y\}$ isomorphic to $V_4$ and it's
Sylow $3$-subgroup is $\{e, x^2,x^4\} \cong \bZ_3$.

However $Z(G) = \{e, x^3\}$ and $G/Z(G) \cong D_6 \cong S_3$ and
$Z(S_3)=\{e\}$. Thus $G$ is not nilpotent. And therefore, $D_{12}
\not \cong V_4 \times \bZ_3$. \qed

We have seen that we have a series of subgroup by taking centers.
Another natural construction is to take commutators.

\begin{defn}
Let $G$ be a group. The commutator of $G$, denoted $G'$ is the
subgroup generated by the subset $\{aba^{-1}b^{-1}|a,b \in G\}$.
\end{defn}

Roughly speaking, the subgroup $G'$ measures  the
non-commutativity of a group. More precisely, $G'= \{e\}$, if and
only  $G$ is abelian. The smaller $G'$, the more commutative it
is.

\begin{prop} We have:\\
1. $G' \lhd G$,\\
2. and $G/G'$ is ableian.\\
3. if $N \lhd G$, then
 $G/N$ is abelian if and only if $ G' < N$.
\end{prop}

\begin{proof}
1.)  for all $g\in G$, $g(aba^{-1}b^{-1})g^{-1} \in G'$, hence
$gG'g < G'$. So $G' \lhd G$.

\noindent 2.) $aG'bG'=abG'=ab(b^{-1}a^{-1}ba)G'=baG'=bG'aG'.$\\
\noindent 3.) Consider $\pi : G \to G/N$. If $G/N$ is abelian,
then $\pi(aba^{-1}b^{-1})=e$, hence $G'<N$. Conversely, if $G'<N$,
we have a surjective homomorphism $G/G' \to G/N$. $G/G'$ is
abelian, hence so is it homomorphic image $G/N$.
\end{proof}
\begin{defn}
We can define the the commutator inductively, i.e.
$G^{(2)}:=(G')',etc$. The $G^{(i)}$ is called the $i$-th derived
subgroup of $G$. It's clear that $G > G'>G^{(2)} >...$.

A group is solvable is $G^{(n)}=\{e\}$ for some $n$.
\end{defn}

\begin{ex} \end{ex}
Take $G=S_4$. The commutator is the smallest subgroup that $G/G'$
is abelian. Since the only non-trivial normal subgroups of $S_4$
are $V,A_4$. It's clear that $G'=A_4$ (Or one can prove this by
hand). Similarly, one finds that $G^{(2)}=A_4'=V$, and
$G^{(3)}=\{e\}$. Hence $S_4$ is solvable. \qed

Another useful description of solvable groups is the groups with
{\it solvable series}.
\begin{defn}
A groups $G$ has a subnormal series if there is a series of
subgroups of $G$
$$ G=H_0 > H_1 >H_2>...>H_n,$$
such that $H_{i} \lhd H_{i-1}$ for all $ 1 \le i \le n$.

A subnormal series is a solvable series if $H_n=\{e\}$ and $
H_{i-1}/H_{i}$ is abelian for all $1 \le i \le n$.

A subnormal series is a normal series if all $H_i$ are normal
subgroups of $G$.
\end{defn}

\begin{thm}
A group is solvable if and only it has a solvable series.
\end{thm}

\begin{proof}
It's clear that $G> G'>...G^{(n)}=\{e\}$ is a solvable series.  It
suffices to prove that a group with a solvable series is solvable.
Suppose now that $G$ has a sovable series $\{e\}=H_n < ...<H_0=G$.
First observe that $G' < H_{1}$ since $G/H_{1}$ is abelian. We
claim that $G^{(i)}<H_{i}$ for all $i$ inductively. Which can be
proved  by the observation that the intersection of the series
$\{e\}=H_n < ...<H_0=G$ with $G^{(i)}$ gives a solvable series of
$G^{(i)}$.
\end{proof}

\begin{ex} \end{ex}
A finite $p$-group has a solvable series, hence is solvable.

Moreover, a nilpotent group is solvable. To see this, let $G$ be a
nilpotent group. Then there exist a series $$\{e\} < C_1(G):=Z(G)
< C_2(G) <...< C_n(G)=G.$$ Notice that $C_{i+1}(G)/ C_{i}(G) = Z(
G/ C_{i}(G))$ is abelian. Therefore this is a solvable series.
\qed

\vfill
 \pagebreak

\begin{center}
 Oct. 27, 2006 (Fri.)
\end{center}

\begin{prop}
Let $H$ be a subgroup of a solvable group $G$, then $H$ is
solvable.

Let $N$ be a normal subgroup of $G$. Then $G$ is solvable if and
only if both $N$ and $G/N$ are solvable.
\end{prop}

\begin{proof}[Sketch]
$G$ has a solvable series, intersecting the series with $H$  gives
a solvable series of $H$.

If $N \lhd G$, then we have $\pi : G \to G/N$. Projecting the
solvable series of $G$ to $G/N$ gives a solvable series of $G/N$.

Finally, if $N$ and $G/N$ are solvable, they have solvable series
respectively. Apply $\pi^{-1}$ to the solvable series of $G/N$
gives a series from $N$ to $G$. Combine this series with the
serious of $H$ gives a solvable series of $G$.
\end{proof}

\begin{ex} \end{ex} We will prove in the coming subsection that
$A_5$ is not solvable, hence so is $S_n$ for $n \ge 5$. \qed



\subsection{normal and subnormal series}
We turning back to series a little bit more. A subnormal series is
called a composition series if every quotient is a simple group.

\begin{defn}
 For a subnormal series, $\{e\}=H_n < ...<H_0=G$, the {\it
factors} of the series are the quotient groups $H_{i-1}/H_{i}$ and
the {\it length} is the number of non-trivial factors. A {\it
refinement} is a series obtained by finite steps of {\it one-step
refinement} which is  $\{e\}=H_n < .<K<..<H_0=G$.
\end{defn}

\begin{defn}
Two series are said to be equivalent if there is a one-to-one
correspondence between the non-trivial factors. And the
corresponding factors groups are isomorphism.
\end{defn}

It's clear that this defines an equivalent relation on subnormal
series.

The main theorems are
\begin{thm}[Schreier]
Any two subnormal (resp. normal) series of a group $G$ have a
subnormal (resp. normal) refinement that are equivalent.
\end{thm}

An immediate corollary is the famous Jordan-H\"older theorem.

\begin{thm}[Jordan-H\"older] Any two composition series of a group
are equivalent.
\end{thm}

The main technique is the Zassenhaus Lemma, or sometimes called
butterfly Lemma.

\begin{lem}[Zassenhaus]
Let $A^* \lhd A$ and $B^* \lhd B$ be subgroups of $G$. Then
\begin{enumerate}
\item $A^*(A \cap B^*) \lhd A^*(A \cap B)$.

\item $B^*(A \cap B) \lhd B^*(A \cap B)$.

\item $A^*(A \cap B)/A^*(A \cap B^*) \cong B^*(A \cap B)/B^*(A^*
\cap B)$.
\end{enumerate}
\end{lem}

\begin{proof}[Sketch]
It's clear that $A\cap B^* = (A \cap B) \cap B^* \lhd A \cap B$.
And similarly, $A^* \cap B \lhd A \cap B$. Let $D=(A\cap
B^*)(A^*\cap B) \lhd A\cap B$. One can have a well-defined
homomorphism $f: A^*(A \cap B) \to A\cap B /D$ with kernel $A^*(A
\cap B^*)$. And similarly for the other homomorphism.
\end{proof}

\begin{proof}[proof of Schreier's theorem]
Let $\{e\}=G_{n+1}<...<G_0=G$ and $\{e\}=H_{m+1}<...<H_0=G$ be two
subnormal series. Let $G(i,j):=G_{i+1}(G_i \cap H_j)$  (resp.
$H(i,j):=H_{j+1} (G_i \cap H_j)$). Then one has a refinement
$$ G=G(0,0) > G(0,1)>...>G(0,m) > G(1,0) >...> G(n,m),$$
$$ G=H(0,0) > H(1,0)>...>H(n,0) > H(0,1) >...> H(n,m).$$
By applying Zaseenhaus Lemma to $G_{i+1},G_i,H_{j+1},H_j$, one has
$$ G(i,j)/G(i,j+1) \cong H(i,j)/H(i+1,j).$$
\end{proof}

\subsection{simplicity of $A_5$}
An element in $S_n$ is said to be have cycle structure
$(m_1,..,m_r)$ with $m_1 \ge m_2 \ge...\ge m_r$ , $m_1+...+m_r=n$
if its cycle decomposition is of length $m_1,...,m_r$
respectively. For example, $(1,2)(3,4) \in S_4$ has cycle
structure $(2,2)$ and $(1,2) \in S_4$ has cycle structure
$(2,1,1)$.

\begin{rem}
There is a one-to-one correspondence between cycle structures of
$S_n$ and partition of the integer $n$.
\end{rem}

A key observation is that any two elements are conjugate to each
other if and only if they have the same cycle structure. Let's
call the set of all elements of cycle structure $(m_1,...,m_r)$
the cycle class of $(m_1,...m_r)$. A consequence of this fact is
that a subgroup $N < S_n$ is normal  if and only if $N$ is union
of cycle classes.

Let's put it another way, given a group $G$, we can always
consider the group action $G \times G \to G$ by conjugation. The
conjugate classes are the orbits. A subgroup $H <G$ is normal if
and only if it is union of orbits. If $G=S_n$, then orbits are
cycle classes.

\begin{ex}
In $S_4$, $V$ is the union of class $(1,1,1,1)$ and $(2,2)$. $A_4$
is the union of $V$ and the class $(3,1)$.
\end{ex}

The purpose of this subsection is to show that $A_5$ is a simple
non-abelian group, hence a non-solvable group.

\begin{thm}
$A_5$ is a simple non-abelian group.
\end{thm}

\begin{proof}
One note that in $S_5$, possible cycle structures are
$(5),(4,1)$,$(3,1$ $,1)$,$(3,2),(2,2,1),(2,1,1,1),(1,1,1,1,1)$
with $24,30,20,20,15,10,1$ elements in each class. While $A_5$ is
the union of classes of $(5),(3,1,1),(2,$ $2,1),(1,1,1,1,1)$.

We consider the actions of conjugation $ \alpha:S_5 \times A_5 \to
A_5$ and its restriction $\beta: A_5 \times A_5 \to A_5$. For
$\sigma \in A_5$, let $\OO_{\alpha,\sigma}$ be the orbit of the
$\alpha$ and $\OO_{\beta,\sigma}$ be the orbit of the $\beta$. And
let $G_{\alpha,\sigma}, G_{\beta,\sigma}$ be the stabilizer.

It's clear that $G_{\alpha,\sigma}=C_{S_5}(\sigma)$ and
$G_{\beta,\sigma}=C_{A_5}(\sigma)=C_{S_5}(\sigma) \cap A_5$. Thus
we have either $|G_{\beta,\sigma}|=\frac{1}{2}
|G_{\alpha,\sigma}|$ or $|G_{\beta,\sigma}|=|G_{\alpha,\sigma}|$.
Hence $|\OO_{\beta,\sigma}|=|\OO_{\alpha,\sigma}|$ or
$|\OO_{\beta,\sigma}|=\frac{1}{2} |\OO_{\alpha,\sigma} |$.

{\bf case 1.} If $\sigma$ has cycle structure $(5)$, then
$|\OO_{\alpha,\sigma} |=24, |G_{\alpha,\sigma}|=5$. It follows
that $|G_{\beta,\sigma}|=5$ and hence $|\OO_{\beta,\sigma}|=12$.

{\bf case 2.} If $\sigma$ has cycle structure $(3,1,1)$, then
$|\OO_{\alpha,\sigma} |=20, |G_{\alpha,\sigma}|=6$. However, one
notice that there is an element $\tau \in
C_{S_5}(\sigma)-C_{A_5}(\sigma)$ (e.g. $(45)(123)=(123)(45)$).
Hence $|G_{\beta,\sigma}| \ne |G_{\alpha,\sigma}|$ and must be
$\frac{1}{2} |G_{\alpha,\sigma}|=3$. Therefore
$|\OO_{\beta,\sigma}|=20$.

{\bf case 3.} If $\sigma$ has cycle structure $(2,2,1)$,then
$|\OO_{\alpha,\sigma} |=15, |G_{\alpha,\sigma}|=8$. It follows
that $|\OO_{\beta,\sigma}|=15$.

Combining all this, if $H< A_5$ is a normal subgroup, then
$|H|=1+12 r_1 + 20 r_2+15 r_3$, where $r_i$ are integers. Moreover
$|H| \mid |A_5|=60$, which is impossible unless $|H|=1 \text{ or }
60$.
\end{proof}

\subsection{simple linear groups}
We have seen that $A_5$ is a simple group. Another important
source of simple groups is via the linear groups.

We first introduce some notions.  Let $V$ be a $m$-dimensional
vector space over a field $K$. Then the {\bf general linear group}
$GL(V)$ is the group of all non-singular linear transformations on
$V$. If we choose a basis $\{e_1,...,e_m\}$ of $V$, then a
non-singular linear transformation can be represented as a
non-singular matrix in $GL(m,K)$.  If $K$ is a field of $q$
elements ( thus unique up to isomorphism, which we will see
later), then we may write $GL(m,q)$ instead.

\begin{prop}
$|GL(m,q)| = (q^m-1)(q^m-q)...(q^m-q^{m-1})$.
\end{prop}

\begin{proof}
Let $\{e_1,...,e_m\}$ be a basis and $A$ a $m\times m$ matrix. $A$
is non-singular if and only  $\{ Ae_1,...,Ae_m \}$ is again a
basis. Or equivalently,   $\{ Ae_1,...,Ae_m \}$ is linearly
independent. $Ae_1$ can have anything but zero, thus there are
$q^m-1$ choices.  And then $Ae_2$ can be anything independent of
$Ae_1$, thus there are $q^m-q$ choices. Inductively, we get the
formula.
\end{proof}

A matrix (or linear transformation) is called {\bf unimodular} if
determinant is $1$. Let $SL(V)$, (resp. $SL(m,K)$ ) be the
subgroups of unimodular matrices. An {\it elementary transvection}
$B_{ij}(\lambda)$ is a matrix which is $1$ along diagonal,
$\lambda$ as its $ij$ entry, and $0$ elsewhere. A {\bf
transvection} is a matrix $B$ such that is similar (which is
conjugate in group theory) to some $B_{ij}(\lambda)$. Note that
$B_{ij}(\lambda)^{-1} = B_{ij}(-\lambda)$.

\begin{lem}
If $A \in GL(m,K)$ with $\det A = \mu$, then $A = U D(\mu)$, where
$U$ is a product of elementary transvections and
$D=diag(1,...,1,\mu)$.
\end{lem}

\begin{proof}[Sketch]
Performing elementary row operations by multiplying elementary
transvections on the left. One sees that it reaches a matrix of type
$D(\mu)$.

For example, we look at first column. Assume that $a_{21}\ne 0$.
Then multiply $B_{12}(a_{21}^{-1}(1-a_{11}))$, one gets a matrix
$A'$ with $A'_{11}=1$. Then multiply $B_{21}(-a_{21})$, the one gets
a matrix $A''$ with $A''_{11}=1,A''_{21}=0$.
\end{proof}

\begin{prop}
We have:\\
\noindent 1. $GL(m,K)$ is a semi-direct product of $SL(m,K)$ by
$K^*$.

\noindent 2. $SL(m,K)$ is generated by elementary transvections.
\end{prop}

\begin{proof}
1. Consider $\det : GL(m,K) \to K^*$. It's clear that this is a
group homomorphism with kernel $SL(m,K)$. Hence $SL(m,K) \lhd
GL(m,K)$. On the other hand, $\Delta:=\{ D(\mu)| \mu \in K^*\} <
GL(m,K)$ and $\Delta \cong K^*$. One can verify that
$GL(m,K)=SL(m,K) \Delta$ by the abbove Lemma. And it's clear that
$SL(m,K) \cap \Delta = \{e\}$. Thus, we are done.

\noindent 2. This follows immediately from above Lemma.
\end{proof}

We now introduce more notations. Let $Z(m,K)$ (resp. $Z(V)$) be the
center of $GL(m,K)$. Then it's easy to see that $Z(m,K)$ is nothing
but scalar matrices. Let $SZ(m,K)=Z(m,K) \cap SL(m,K)$, the group of
unimodular scalar matrices. One can also verify that
$Z(SL(m,K))=SZ(m,K)$.

In order to compute the cardinality of $SZ(m,K)$, we recall the
following fact:

\begin{prop} Let $K$ be a field.\\
\noindent 1. $x^n=1$ has at most $n$ solutions in $K$.

\noindent 2. Every finite subgroup of $K^*$ is cyclic. In
particular, if $K$ is finite, then $K^*$ is cyclic.
\end{prop}

As a result, if $K$ is a finite field of $q$ elements, then $x^m=1$
has exactly $(q-1,m)$ solutions. Thus $SZ(m,q) = (q-1,m)$.

Let $PGL(V):= GL(V)/ Z(V)$ and $PSL(V):= SL(V)/SZ(V)$. Then we
have
$$ |PGL(m,q)|= |SL(m,q)|=(q^m-1)(q^m-q)...(q^m-q^{m-1}) / (q-1),$$
$$ |PSL(m,q)| =(q^m-1)(q^m-q)...(q^m-q^{m-1}) / d(q-1),$$
where $d= (q-1,m)$.

We now give some more example of finite simple groups.

\begin{thm}
The group $PSL(2,q)$ are simple if and only if $q >3$.
\end{thm}

\begin{proof}
If $q=2,3$, then $|PSL(2,2)|=6, |PSL(2,3)|=12$. Hence they are not
simple.

Assume now that $q \ge 4$. Let $N \lhd PSL(2,q)$ and $H \lhd
SL(2,q)$ be its preimage. It is enough to show that if $SZ(m,q)
\lneq H < SL(m,q)$, then $H=SL(m,q)$.

\noindent 1. For any matrix $A \in H  - SZ(m,q)$.
 Then its rational canonical form is either $\left[ \begin{array}{cc} \alpha & 0 \\ 0 &
 \alpha^{-1}
 \end{array} \right]$ or $\left[ \begin{array}{cc} 0 & -1 \\ 1 & \beta
 \end{array} \right]$.

\noindent 2. In either case, $H$ contains a matrix of the form
$\left[
\begin{array}{cc} \alpha & 0 \\ \beta &
 \alpha^{-1}
 \end{array} \right]$ with $\alpha \ne \pm1$.

 To see this, it remains to consider $A$ in the second case. We assume $A= \left[ \begin{array}{cc} 0 & -1 \\ 1 & \beta
 \end{array} \right]$. Then $ TA T^{-1}A^{-1} = \left[ \begin{array}{cc} \alpha^{-2} & 0 \\ \beta(\alpha^2-1)  &
 \alpha^2
 \end{array} \right] \in H$ for $T=\left[ \begin{array}{cc} \alpha & 0 \\ 0 &
 \alpha^{-1}
 \end{array} \right]$ . We can pick $\alpha$ so that $\alpha^2 \ne
 \pm 1$ (unless $q=5$, this case need some extra care).

 \noindent 3. Let $B=B_{21}(1)$, $A= \left[
\begin{array}{cc} \alpha & 0 \\ \beta &
 \alpha^{-1}
 \end{array} \right]$ with $\alpha \ne \pm1$. Then $H$ contains
 $BAB^{-1}A^{-1}=B_{21}(1-\alpha^{-2})$, an elementary tranvection with $1-\alpha^{-2} \ne 0$.

 \noindent 4. If $H$ contains $B_{21}(\mu)$, then $ U B_{21}(\mu)
 U^{-1} = B_{12}(-\mu)$ for $U =\left[
\begin{array}{cc} 0 & -1 \\ 1 &
 0
 \end{array} \right]$.

 \noindent 5. It remains to show that $H$ contains $B_{12}(\nu)$
 for all $\nu \in K$ since $SL(m,q)$ is generated by
 transvections.

 To see this, note that
 $$ \left[
\begin{array}{cc} \alpha & \beta \\ 0 &
 \alpha^{-1} \end{array} \right]    \left[  \begin{array}{cc} 1 & \mu \\ 0 & 1 \end{array} \right]  \left[
\begin{array}{cc} \alpha & \beta \\ 0 &
 \alpha^{-1} \end{array} \right]^{-1} =  \left[
\begin{array}{cc} 1 & \mu \alpha^2 \\ 0 &
1 \end{array} \right].$$

Let $G=\{0\} \cup \{ \mu  \in K | B_{12}(\mu) \in H\}$. It's clear
that $G$ is an additive group and  contains all elements of the
form $\mu (\alpha^2-\beta^2)$.

We claim that $G=K$.

If $char(K) \ne 2$, then $\nu = (\frac{1}{2}(\nu +1))^2 -
(\frac{1}{2} (\nu -1))^2$. Thus for given $\nu \in K$, $\nu
\mu^{-1} = \xi^2-\zeta^2$. It follows that $\nu \in G$.

If $char(K)=2$, then $|K^*|$ is a cyclic group of odd order. Thus
for $\nu \in K^*$, $\nu \mu^{-1} \in K^*$ and $\nu \mu^{-1} =
\zeta^2$ for some $\zeta$. Thus, $\nu = \mu \zeta^2 \in G$.
\end{proof}

\begin{ex} \end{ex}
On can even show that $A_n$ is simple for $n \ge 5$. \qed

\begin{ex} \end{ex}
$|PSL(2,4)|=|PSL(2,5)|=60$. And they are simple. So In fact, we
have $ PSL(2,4) \cong PSL(2,5) \cong A_5$. \\
$|PSL(2,7)|=168$, so it can not be $A_n$. \\
$PSL(2,9) \cong A_6$. \qed

We finally give some more results concerning simple groups.
However, we are not going to prove these.

\begin{thm} [Jordan-Dickson] If $m \ge 3$ and $V$ is an
$m$-dimensional vector space over a field $K$, then $PSL(V)$ is
simple.
\end{thm}

\begin{prop}
$PSL(3,4)$ and $A_8$ are non-isomorphic simple groups of the same
order.
\end{prop}


\vfill
 \pagebreak

\begin{center}
 Nov. 3, 2006 (Fri.)
\end{center}
\section{field theory}

\subsection{definitions and basic properties}
A field $F$ is a set together two binary operation $+,*$ such that
$(F,+)$ is an abelian group with identity $0$,  $(F^*:=F-\{0\},
*)$ is an abelian group with identity $1$, and satisfying
$a*(b+c)=a*b+a*c$.

Let $E,F$ be fields, a homomorphism of fields is nothing but a
ring homomorphism $\varphi: E \to F$. Note that $\varphi(1_E)=1_F$

\begin{ex} \end{ex} Let $p$ be a prime. Then $\bZ_p$ is a field.
Let $F$ be a field of $p$ elements, then clearly there is an
isomorphism $F \cong \bZ_p$ (by sending $1_{\bZ_p}$ to $1_F$).
Thus we usually say {\it the} field of $p$-elements and denoted
$\bF_p$. \qed

Give a field $F$, let $P$ be its minimal (non-zero) subfield. Then
we have:
\begin{prop}
$P$ is isomorphic to either $\bQ$ or $\bF_p$.
\end{prop}

\begin{proof}
Consider the additive subgroup $H$ generated by $1_F$, then $H$ is
either $\bZ$ or $\bZ_p$. If it's $\bZ_p$ then this is exactly $P$.
And if $H=\bZ$, then one can show that $P \cong \bQ$.
\end{proof}

\begin{defn}
The minimal subfield if called the {\bf prime field } of $F$. If
the prime field is $\bF_p$, then we say that $F$ has
characteristic $p$, denoted $\chr(F)=p$. Otherwise, we say that
$F$ has characteristic $0$, denoted $\chr(F)=0$.
\end{defn}

The most important feature for field of characteristic $p$ is that
it has a non-trivial {\it Frobenius map} $\varphi: F \to F,
\varphi(x) \mapsto x^p$. To verify that this is an homomorphism,
we need to check that $\varphi(x)+\varphi(y)=\varphi(x+y)$. Note
that $px =0$ for all $x \in F$ and thus $n x =0$ for all $n$
divisible by $p$. It follows that $C^{p}_i x =0$ for all $ 0 < i <
p$ and all $x \in F$. Hence $(x+y)^p= x^p + y^p$.

In fact, the FRobenius map is always injective for if $x^p=y^p$,
then $x^p-y^p= (x-y)^p =0$. Thus $x-y=0$.

\begin{ex} \end{ex} We have the following important construction
of fields. Let $F$ be a field, $F[x]$ be the polynomial ring. Let
$p(x) \in F[x]$ be an irreducible polynomial.  We claim that
$F[x]/ (p(x))$ is a field.

Recall that there is a division algorithm on $F[x]$. That is,
given $f(x), g(x) \ne 0 \in F[x]$, there exist $q(x),r(x) \in
F[x]$ such that $ f(x)= g(x)q(x) +r(x)$ with either $r(x)=0$ or
$deg(r(x)) < deg(g(x))$. (This shows that $F[x]$ is an Euclidean
domain (E.D.).)

With this properties, one can show that every ideal is of the form
$(f(x))$, i.e. $F[x]$ is a principal ideal domain (PID). For a
given ideal $I \lhd F[x]$, this can be achieved by pick $f(x) \in
I$ of minimal degree. For any $g(x) \in I$, performing the
division algorithm, one sees that $r(x)=0$ for otherwise one gets
a polynomial of even smaller degree, which is absurd.

One method is to show that $(p(x)) lhd F[x]$ is a maximal ideal.
Suppose we have  $ (p(x)) < \frak{m} \lneq F[x]$. Since
$\frak{m}=(f(x))$, it follows that $p(x) \in (f(x))$ and thus
$p(x)= f(x)g(x)$. $p(x)$ is irreducible implies that $f(x)=c p(x)$
for some $c \in F$. Anyway, $(p(x)) = (f(x))$.

Or explicitly, a non-zero element in  $ F[x]/(p(x))$ is of the
form $\overline{f(x)}$ for some $f(x) \in F[x]$ and $f(x) \not \in
(p(x))$. Thus $(f(x),p(x))=1$. By the division algorithm, there
exists $s(x),t(x)$ such that $1= s(x) f(x) + t(x) p(x)$. Hence
$\overline{f(x)} \overline{s(x)} =1$.

If $n=deg(p(x))$, then the element in the field $F[x]/(p(x))$ can
be written as $ \{ a_0+ a_1 \bar{x}+...a_{n-1}\bar{x}^{n-1}\}$.
\qed


Before we move on, we need the following facts.
\begin{prop}\label{root}
Let $f(x) \in F[x]$ be a polynomial of degree $n$, then there are
at most $n$ roots in $F$.
\end{prop}

\begin{proof}
$a$ is said to be a root of $f(x)$ if $f(a)=0$. Note that, by
division algorithm, $f(x)=q(x) (x-a) +r(x)$ with $r(x)=0$ or
$deg(r(x)) =0$. $a$ is a root if and only if $r(x)=0$ if and only
if $(x-a) | f(x)$. Inductively and by the unique factorization of
$F[x]$. One sees that there are at most $n$ roots.
\end{proof}

\begin{prop}
Let $G < F^*$ be a finite group. Then $G$ is cyclic.
\end{prop}

\begin{proof}
By Corollary \ref{ftab}, $G \cong \bZ_{m_1} \oplus ... \oplus
\bZ_{m_d}$. Note that, on the right hand side, $m_d x = 0$ for all
$x$. Thus $a^{m_d} =1$ for all $a \in G$. ( On $G$, we use
multiplicative notations, while right hand side is additive). Thus
every element in $G$ is a root of $x^{m_d}-1$. So we have
$$ |G| = m_1 ... m_d  \le m_d.$$
This is possible only when $d=1$.
\end{proof}



\subsection{field extensions}

Let $K$ be a subfield of $F$, then we say that $F$ is an extension
over $K$ and denote it by $F/K$. Recall that $F$ can be viewed as
a vector space over $K$. We say that the extension $F/K$ is finite
of infinite according the dimension of $F$ as a vector space over
$K$.

Let $F/K$ be an extension, an element $u \in F$ is said to be {\it
algebraic} over $K$ if there is a non-zero polynomial $f(x) \in
K[x]$ such that $f(u)=0$. In other words, the ring homomorphism
$$\varphi: K[x] \to F ,$$
$$ f(x) \mapsto f(u)$$ has a non-zero kernel. Let $I$ be the
kernel. Since $K[x]$ is a PID, $I=(p(x))$ for some $p(x)$. Let
$K[u]$ be the image of $\varphi$, then $$ K[x]/(p(x)) \cong K[u]
\subset F .$$ It's easy that $(p(x))$ is a prime ideal, that is,
$p(x)$ is irreducible. We may assume that $p(x)$ has leading
coefficient $1$. Such $p(x)$ is called the minimal polynomial of
$u$ over $K$.

We say that $F/K$ is algebraic if every  element of $F$ is
algebraic over $K$.

Let's recall some more properties. If $F/K$, then we denote
$[F:K]$ to be  the dimension $ \dimm_K F$.

\begin{prop}
If $E/F$ and $F/K$, then $[E:F][F:K]=[E:K] $.
\end{prop}
\begin{proof}[Sketch of the proof]
Let $\{ u_i\} _{i \in I}$ be a basis of $E/F$ and  $\{ v_j\} _{j
\in J}$ be a basis of $F/K$. Then one can prove that $\{ u_i v_j\}
_{(i,j) \in I \times J}$ is a basis of $E/K$. Hence
$$[E:K]= | I \times J| = |I|\cdot |J| =[E:F]\cdot [F:K].$$
\end{proof}
\begin{prop}
Suppose that we have a tower of fields $K \subset F \subset E$.
Then $E$ is finite over $K$ if and only if $E$ is finite over $F$
and $F$ is finite over $K$.
\end{prop}

\begin{proof}
Easy corollary of the previous proposition.
\end{proof}

\begin{prop}
If $F/K$ is finite, then $F/K$ is algebraic.
\end{prop}

\begin{proof}
suppose that $[F:K]=n$.  For any $u \ne 0 \in F$, then
$\{1,u,...,u^n\}$ is linearly dependent over $K$. Thus there are
$a_0,...,a_n \in K$ non all zero such that $\sum_{i=0}^{n} a_i
u^i=0$. It follows that $u$ satisfies the polynomial $f(x)
=\sum_{i=0}^{n} a_i x^i \in K[x]$.
\end{proof}

Let $F/K$ be an extension, and $u \in F$. We denote by $K(u)$ the
smallest subfield of $F$ containing $K$ and $u$. It's easy to see
that $$K(u)=\{ \frac{f(u)}{g(u)}| f(x),g(x) \in K[x], g(u) \ne
0\}.$$ Similarly, for $S \subset F$, we denote by $K(S)$ the
smallest subfield containing both $K$ and $S$. If $F=K(S)$ for a
finite set $S$, then $F$ is said to be {\it finitely generated}
over $K$.



\begin{prop}
Let $F/K$ be an extension. Then $u \in F$ is algebraic over $K$ if
and only if $K(u)=K[u]$. And in the algebraic case, $[K[u]:K]=
deg(p(x))$, where $p(x)$ is the minimal polynomial.
\end{prop}

\begin{proof}[Sketch of the proof]
If $u \in F$ is algebraic over $K$, let $p(x)$ be the minimal
polynomial. One sees that $g(u) \ne 0$ if and only
$(g(x),p(x))=1$. There are $s(x),t(x)$ such that $$ 1=
s(x)g(x)+t(x)p(x),$$ hence $ 1= s(u) g(u)$. One has
$\frac{f(u)}{g(u)} = f(u)s(u)$ and hence $K(u) \subset K[u]$.

Conversely, $\frac{1}{u} \in K(u)=K[u]$. Thus $\frac{1}{u}=f(u)$
for some $f(x) \in K[x]$. One sees that $u$ satisfies $xf(x)-1$.
\end{proof}

\begin{prop}
$F/K$ is finite if and only if $F/K$ is finitely generated and
algebraic.
\end{prop}
\begin{proof}[Sketch of the proof]
If $F/K$ is finite, let $\{u_1,...,u_n\}$ be a basis of $F/K$,
then $F=K(u_1,...,u_n)$ hence is finitely generated.

Conversely, suppose that $F=K(u_1,...,u_n)$ is algebraic over $K$.
In particular, each $u_i$ is algebraic over $K$. In particular,
$u_1$ is algebraic over $K$, $u_2$ is algebraic over $K(u_1)$, and
so on. Then one has that
$$[K(u_1,...,u_n):K]=[K(u_1,...,u_n):K(u_1,...,u_{n-1})] \cdot [K(u_1,...,u_{n-1}):K]$$ is finite by induction.
\end{proof}

\begin{prop}
Suppose that we have a tower of fields $K \subset F \subset E$.
Then $E$ is algebraic  over $K$ if and only if $E$ is algebraic
over $F$ and $F$ is algebraic over $K$.
\end{prop}

\begin{proof}[Sketch of the proof]
We will only prove that $E$ is algebraic over $F$ and $F$ is
algebraic over $K$ implies that $E$ is algebraic over $K$. The
remaining statement are easy.

Pick any $u \in E$. Since $u$ is algebraic over $F$, let
$f(x)=\sum a_i x^i$ be the minimal polynomial of $u$ over $F$.

We then consider the field $F':=K(a_0,...,a_n)$. It's clear that
$u$ satisfies a polynomial $f(x) \in F'[x]$. It follows that $u
\in F'(u)$ which is finite over $K$. Therefore, $u$ is algebraic
over $K$.
\end{proof}

Let $L/K$ and $M/K$ are extensions over $K$ and both $L,M$ are
contained in a field $F$. We denote by $LM$ the smallest subfield
containing both $L$ and $M$. $LM$ is called the compositum of $L$
and $M$.

A useful remark is that if $L=K(S)$ for some $S \subset L$, then
$LM=M(S)$.

For a certain property of field extension, denoted $\mathcal{C}$,
we are interested whether $\mathcal{C}$ is preserved after
extension, lifting or compositum. More precisely, we would like to
know a property $\mathcal{C}$ satisfying the following conditions:

\begin{enumerate}
\item (extension) Both $E/F$ and $F/K$ are $\mathcal{C}$ if and
only if $E/K$ is $\mathcal{C}$.

\item (lifting/ base change) If $E/K$ is $\mathcal{C}$, then
$EF/F$ is $\mathcal{C}$.

\item (compositum) If both $E/K, F/K$ are $\mathcal{C}$, then
$EF/K$ is $\mathcal{C}$.
\end{enumerate}
\begin{prop}
The property of being finite or algebraic satisfying the above
three.
\end{prop}

\begin{proof}[Sketch of the proof]
It's easy to that being finite and finitely generated satisfies
the above three statement. Hence so does being algebraic.
\end{proof}


\begin{thm}
Let $F$ be an extension over $K$, and $E$ the set of all elements
in $F$ which is algebraic over $K$. Then $E$ is a field.
\end{thm}

\begin{proof}
If $u, v \in E$, we need to show that $u+v , uv \in E$. Note that
$u+v, uv \in K(u,v)$ and $K(u,v)/K$ is finitely generated and
algebraic, hence finite. It follows that both $u+v, uv$ are
algebraic over $K$.
\end{proof}

\begin{ex} \end{ex} Consider $\bC / \bQ$. A number $u \in \bC$
which is algebraic over $\bQ$ is called an algebraic number. The
set of all algebraic numbers, denoted $\mathcal{A}$, is a field,
algebraic but not finite over $\bQ$.

\vfill
 \pagebreak

\begin{center}
 Nov. 10, 2006 (Fri.)
\end{center}
\subsection{irreducibility}

One of the most important construction of field extension comes
from the extension of the form $K[x]/(p(x))$ with $p(x)$ an
irreducible polynomial. It is therefore natural to give some
criterion for irreducibility of polynomials.

\begin{thm}[Gauss' Lemma]
Let $D$ be a UFD, and $K$ be its field of quotients. Given a
polynomial $f(x) \in D[x]$. Then $f(x)$ is irreducible in  $D[x]$
if and only if $f(x)$ is irreducible in $K[x]$.
\end{thm}

\begin{proof}[Sketch]
{\bf 1.} $f(x)$ is irreducible in $K[x]$ then $f(x)$ is
irreducible in $D[x]$.

\noindent {\bf 2.} Given an irreducible $f(x) \in D[x]$. We may
assume that $f(x)$ is primitive, that is, the g.c.d of coefficient
is $1$.  If $f(x)=g(x) h(x) \in K[x]$, by clearing the
denominators, we have $ a f(x) =( b g(x))( c h(x) )$ with $a,b,c
\in K$ and $af(x), b g(x), cf(x) \in D[x]$ being primitive.

The main ingredient is:\\
\noindent {\bf 3.} In $D[x]$, if $s[x],t[x]$ are primitive, then
so is $s[x]t[x]$.

To see this, suppose that $d \ne 1$ is the g.c.d of coefficient of
$s[x]t[x]$. Let $p$ be a prime factor of $d$. We consider the ring
homomorphism $-: D[x] \to D/(p) [x]$. Then $$0=\overline
{s[x]t[x]} =(\overline {s[x]})( \overline {t[x]}) \ne 0.$$

\noindent {\bf 4.} It follows that $a f(x) \in D[x]$ is also
primitive. Write $a= \frac{q}{p}$ with $(p,q)=1$. It follows that
$p| (q a_0,...,q a_n) =q$, where $a_i$ are coefficients of $f(x)$.
This is the required contradiction.
\end{proof}

The following observation is easy but useful:
\begin{prop}
Let $f(x) \in D[x]$ be a monic polynomial, $\frak{p} \lhd d$ be a
prime ideal. We consider $-: D[x] \to D/\frak{p} [x]$. If
$\overline{f(x)}$ is irreducible in $D/\frak{p} [x]$, then $f(x)$
is irreducible in $D[x]$.
\end{prop}

\begin{ex} \end{ex}
Given $f(x) = x^2 + 517x +65535 \in \bZ[x]$, we may consider
$-:\bZ[x] \to \bZ_2[x]$. Then $\overline{f(x)}=x^2+x+1$ is
irreducible in $\bZ_2[x]$, hence irreducible in $\bZ[x]$. By
Gauss' Lemma, it's also irreducible in $\bQ[x]$. \qed

We also recall
\begin{prop}[Eisenstein's criterion]
Let $f(x) = a_n x^n + ...+ a_0 \in \bZ[x]$. If there is a prime
$p$ such that $p \nmid a_n, p|a_{n-1},...,p|a_0$, and $p^2
 \nmid a_0$. Then $f(x)$ is irreducible.
\end{prop}

\begin{proof}
If $f(x)= g(x) h(x)$, then we consider $-: \bZ[x] \to \bZ_p [x]$.
Thus $$ \overline{ a_n x^n} = \overline{f(x)} = \overline{ g(x)}
\overline{ h(x)}.$$ It follows that both $\overline{
g(x)},\overline{ h(x)}$ are of the form $\alpha x^m \in \bZ_p[x]$
with $m \ge 1$. Therefore, we may write $g(x) = b_m x^m
+...+b_0$,$f(x)= c_k x^k+...+c_0$ with $p | b_0, p |c_0$. Then
$p^2 | b_0 c_0 = a_0$, a contradiction.
\end{proof}

\subsection{algebraic closed fields and algebraic closure}
In this section, we are going to prove the existence and
uniqueness of algebraic closure. As a consequence, we are able to
show the existence and uniqueness of splitting fields.

To motivate the study of algebraic closure, we start with
examples:

\begin{ex} \end{ex}
Consider $\bQ[\root 3 \of 2]/\bQ$ and $\bQ[\root 3 \of 2 \omega] /
\bQ$. There is a isomorphism $\varphi: \bQ[\root 3 \of 2] \to
\bQ[\root 3 \of 2 \omega]$ with $\varphi( \root 3 \of 2) = \root 3
\of 2 \omega$, and $\varphi(a) =a$ for $ a \in \bQ$.

This follows from the natural isomorphism $ \bQ[x]/(x^3-2) \to
\bQ[\root 3 \of 2]$ and $\bQ[x]/(x^3-2) \to \bQ[\root 3 \of 2
\omega]$. \qed

In general, given a extension $F/K$,  if $u,v \in F$ are two roots
of an irreducible polynomial $p(x) \in K[x]$, then $K[u] \cong
K[v]$. Therefore, starting with a field $K$ and an irreducible
polynomial $p(x) \in K[x]$. It's convenient that we have a field
$F$ containing all roots of $p(x)$ in advance. Or even more, we
would like to have a field containing all roots of all polynomial
in $K[x]$.


\begin{prop}\label{algclosed} Let $F$ be a field.
The following are equivalent:

\begin{enumerate}
\item Every polynomial  of $F[x]$ of degree $\ge 1$  has a root in
$F$.

\item Every polynomial of $F[x]$ of degree $\ge 1$ has all the
roots in $F$.

\item Every irreducible polynomial in $F[x]$ has degree $\le 1$

\item If $E$ is an algebraic extension over $F$, then $E=F$.

\item There is a subfield $K \subset F$ such that $F$ is algebraic
over $K$ and every polynomial in $K[x]$ splits in $F[x]$.


\end{enumerate}

\end{prop}

\begin{defn}
A field $F$ satisfying above conditions is said to be
algebraically closed.
\end{defn}

\begin{proof}[Sketch]
$(1)\Rightarrow(2)$ by induction on degree. And hence
$(1)\Leftrightarrow(2)$ are equivalent. It's easy to see that $
(2) \Leftrightarrow (3)$. We now look at $(3)$ and $(4)$. If $ E$
is an algebraic extension. Pick $u \in E$ algebraic over $F$ with
minimal polynomial $p(x)$. By $(3)$, $p(x)$ has degree $1$, hence
$ [E:F]=deg(p(x))=1$. In particular, $E=F$. Conversely, if there
is an irreducible polynomial $p(x)$ of degree $>1$, then
$K[x]/(p(x))$ gives an algebraic extension of degree $deg(p(x))$.
This leads to a contradiction, hence $(4)$ implies $(3)$.

Lastly, it's clear that $(3)$ implies $(5)$ by picking $K=F$. We
now prove that $(5) \Rightarrow (4)$. Let $E$ be an algebraic
extension over $F$. For any $u \in E$, $u$ is algebraic over $K$
as well. Let $p_F(x), p_K(x)$ be the minimal polynomial of $u$
over $F,K$ respectively. By viewing $p_K(x)$ as a polynomial in
$F$, then one has $p_F(x)| p_K(x) \in F[x]$. However, $p_K(x)$
splits in $F[x]$. It follows that $p_F(x)$ has degree $1$. And
hence $u \in F$. Thus $E=F$.
\end{proof}

We can also define the notion of algebraic closure.

\begin{prop} Let $F/K$ be an extension.
The following are equivalent.
\begin{enumerate}
\item $F/K$ is algebraic, and $F$ is algebraically closed.

\item $F/K$ is algebraic, and every polynomial in $K[x]$ splits in
$F[x]$.

\item $F$ is a splitting field of all polynomials of $K$.
\end{enumerate}
\end{prop}

\begin{proof} The proof is an easy consequence of the Proposition \ref{algclosed},
we leave it to the readers.
\end{proof}

\begin{defn}
$F$ is said to be an algebraical closure of $K$ if $F/K$ satisfies
the  above conditions.
\end{defn}


\begin{thm}
Algebraic closure exists.
\end{thm}

The following is due to M. Artin as it appeared in [Lang,
Algebra].

\begin{proof} Let $K$ be a field.

{\bf Step 1.} There is an extension $E_1$ over $K$ such that every
polynomial of degree $\ge 1$ has a root in $E_1$.

To this end, let $S$ be the set of all polynomials of degree $\ge
1$. We consider $K[S]$ to be the polynomial ring with
indeterminates $x_f$, for $f \in S$. Consider now an ideal
$I=<f(x_f)>_{f \in S}$. We claim that $I \ne K[S]$, hence $I
\subset \frak{m}$ for some maximal ideal $\frak{m}$. The field
$K[S]/\frak{m}$ gives an extension $E_1$ over $K$. Now, for every
$f(x) \in K[x]$, one sees that
$f(\overline{x_f})=\overline{f(x_f)}=0 \in E$. Hence $f(x)$ has a
root $\overline{x_f}$ in $E_1$.

It remains to show that $I \ne K[S]$. Suppose on the contrary that
$I=K[S]$, in particular, $1 \in I$. We may write
$$ 1= \sum_{i=1}^r g(X) f_i(x_{f_i}).$$
One can construct an algebraic extension $F/K$ such that each
$f_i$ has a root $u_i$ in $F$. Substitute $x_{f_i}$ by $u_i$ in
$F$, one has
$$ 1 = \sum_{i=1}^r g(X) f_i(u_i)=0 \in F,$$
which is the required contradiction.

{\bf Step 2.} Inductively, one has $K=E_0 \subset E_1 \subset
E_2...$. Let $E = \cup E_i$, then $E$ is a field extension over
$K$. And $E$ is algebraically closed.

To see this, for any polynomial $f(x)=\sum a_i x^i \in E[x]$, $a_i
\in E_{j_i}$ for some $j_i$. One can pick $J$ maximal among $j_i$
so that $a_i \in E_J$ for all $i$. Hence $f(x) \in E_J$. By
construction, $f(x)$ has a root in $E_{J+1}$, and inductively,
$f(x)$ has all its root in $E_{J+d}$, where $d= deg(f(x))$.
Therefore, $f(x)$ has all its root in $E$.

{\bf Step 3.} Let $E_a:=\{ u \in E | u \text{ is algebraic over }
K\}$. Then $E_a$ is an algebraic closure of $K$.

It's an easy exercise to check that $E_a$ is a field extension
over $K$. We leave it to the readers. It's also clear that $E_a$
is algebraic over $K$. Hence, it suffices to check that $E_a$ is
algebraically closed.

To see this, one notices that every polynomial of $K[x]$ splits in
$E$ and it follows that every root of $K[x]$ is in $E_a$.
Therefore, one has that every polynomial of $K[x]$ splits in $E_a$
and we are done.
\end{proof}

\begin{rem}
An algebraically closed field must be infinite. \\
Suppose that $F$ is algebraically closed and $F= \{ a_1,..,a_n \ne
0\}$. We consider $f(x):= \prod (x-a_i) +a_n$. Then $f(x)$ has no
root in $F$, a contradiction.
\end{rem}

We next work on the uniqueness of algebraic closure. The main
ingredient is the following extension theorem.

\begin{thm}[Extension theorem]
Let $\sigma: K \to L$ be an embedding to an algebraically closed
field $L$. Let $E/K$ be an algebraic extension. Then one can
extend the embedding $\sigma$ to an embedding $\bar{\sigma}: E \to
L$. That is, there is an embedding $\bar{\sigma}: E \to L$ such
that $\bar{\sigma}|_K=\sigma$.
\end{thm}

We remark that $L$ is not necessarily an algebraic closure of $K$.
For example, $L$ could be something like $\overline{ K(x)}$, an
algebraic closure of $K(x)$.

In order to prove the uniqueness, we need the following useful
Lemma.

\begin{lem}
Let $E/K$ be an algebraic extension and $\sigma : E \to E$ be an
embedding such that $\sigma|_K={\bf 1}_K $. Then $\sigma$ is an
isomorphism.
\end{lem}

\begin{proof}
If $E/K$ is finite, then injective implies isomorphic in the case
of finite dimensional vector space.

In general, let's pick any $u \in E$. It suffices to show that $u$
is in the image of $\sigma$. To see this, let $p(x)$ be the
minimal polynomial of $u$ over $K$ and $u=u_1,u_2,...,u_r$ be the
roots of $p(x)$ in $E$. Let $E':=K(u_1,...,u_r)$. It's clear that
for each $i$, $\sigma(u_i)=u_j$ for some $j$. Hence $\sigma|_{E'}$
gives an homomorphism from $E'$ to $E'$.

Now $ \sigma|_{E'}: E' \to E'$ is an injective homomorphism of
finite dimensional vector space $E'/K$. Therefore, $\sigma|_{E'}$
is an isomorphism. In particular, $u$ is in the image of
$\sigma|_{E'}$ and therefore in the image of $\sigma$.
\end{proof}

\begin{proof}[Sketch of the theorem]
The staring point is an extension to a simple extension. More
precisely, let $u \in E$ be  algebraic over $K$ with minimal
polynomial $p(x)$. Then $p^\sigma(x)$ is an irreducible polynomial
in $\sigma(K)[x]$. In $L$, Pick any root $v$ of $p^\sigma(x)$ in
$\sigma(K)[x]$. This is possible  since $L$ is algebraically
closed. One claims that there is an isomorphism ( hence an
embedding to $L$)
$$ \bar{\sigma}: K(u) \to \sigma(K)(v) \subset L$$
extending $\sigma$. We leave the detail to the readers.

In order to work on the general case, we apply Zorn's Lemma to the
non-empty P.O. set of fields $$ S:=\{ (F, \tau)| K \subset F
\subset E,  \tau: F \to L, \tau|_K=\sigma\}.$$ The ordering is
given naturally as: $(F_1, \tau_1) \le (F_2, \tau_2)$ if $F_1
\subset F_2 $ and $\tau_1 = \tau_2|_{F_1}$.

By Zorn's Lemma, there is a maximal element, say $E_m$. It's easy
to see that $E_m=E$. Otherwise, pick any $u \in E$, which is
algebraic over $K$ and hence over $E_m$. There is an extension to
$E_m(u)$ as we have seen in the first paragraph. This is a
contradiction to the maximality of $E_m$. Hence $E_m=E$.
\end{proof}

\begin{lem}
Let $E/K$ be an algebraic extension and $\sigma : E \to E$ be an
embedding such that $\sigma|_K={\bf 1}_K $. Then $\sigma$ is an
isomorphism.
\end{lem}

\begin{proof}
If $E/K$ is finite, then injective implies isomorphic in the case
of finite dimensional vector space.

In general, let's pick any $u \in E$. It suffices to show that $u$
is in the image of $\sigma$. To see this, let $p(x)$ be the
minimal polynomial of $u$ over $K$ and $u=u_1,u_2,...,u_r$ be the
roots of $p(x)$ in $E$. Let $E':=K(u_1,...,u_r)$. It's clear that
for each $i$, $\sigma(u_i)=u_j$ for some $j$. Hence $\sigma|_{E'}$
gives an homomorphism from $E'$ to $E'$.

Now $ \sigma|_{E'}: E' \to E'$ is an injective homomorphism of
finite dimensional vector space $E'/K$. Therefore, $\sigma|_{E'}$
is an isomorphism. In particular, $u$ is in the image of
$\sigma|_{E'}$ and therefore in the image of $\sigma$.
\end{proof}

\begin{cor}
Algebraic closure of a field is unique up to isomorphism.
\end{cor}

\begin{proof}
Suppose  that $E, F$ are algebraic closure of $K$. By the
extension theorem, there are embedding $\sigma: E \to F$ and
$\tau: F \to E$ such that $\sigma|_K=\tau|_K={\bf 1}_K$.

Hence one has an embedding $\sigma \circ \tau: F \to F$, which is
an isomorphism by the Lemma. Similarly, $\tau \circ \sigma$ is an
isomorphism. Hence $E$ and $F$ are isomorphic.
\end{proof}



\vfill \pagebreak
\begin{center}
Nov. 17, 2006
\end{center}
\subsection{splitting fields and normal extensions}
We have seen that given a field $K$, there is a unique (up to
isomorphism) algebraic closure, denoted $\overline{K}$. Then it is
convenient for our further study of roots of polynomial. Even
though we do not know the roots explicitly, we know that there are
{\it in} its algebraic closure. This make the discussion of root
of polynomials more concrete.


Let $K$ be a field and $f(x) \in K[x]$. Let $\{u_1,...,u_r\}$ be
the roots of $f(x)$ in its algebraic closure $\overline{K}$. Then
the field $K(u_1,...,u_r)$ is called the {\bf splitting field of
$f(x)$ over $K$}. The splitting field is the smallest field that
containing all roots.

Given a set of polynomial $S \subset K[x]$, we can similarly
define the splitting field of $S$ to be the field generated by all
roots of polynomials in $S$.

In this section, we are going to prove the existence and
uniqueness of splitting fields. And we introduce the notion of
normal extension.

\begin{prop} Let $K$ be a field.
And $S$ be a set of polynomial in $K[x]$.  Then
\begin{enumerate}

\item Any two splitting field are isomorphic.

\item If $F_1,F_2$ are two splitting fields in a fixed algebraic
closure $\overline{K}$, then $F_1=F_2$.
\end{enumerate}
\end{prop}

\begin{proof}
Let $F_1$ and $F_2$ be two splitting fields, one has an
$K$-embedding $\sigma: K \to \overline{F_2}=\overline{K}$. This
embedding can be extended to $\tilde{\sigma}: F_1 \to
\overline{F_2}$ by the extension theorem. One can prove that image
of $\tilde{\sigma}$ is in $F_2$. Hence one has an injective
homomorphism $ \tilde{\sigma}: F_1 \to F_2$. Similarly there is
another one $\tilde{\tau} : F_2 \to F_1$. It's easy to show that
these give the isomorphism.
\end{proof}

\begin{prop} Let $N$ be an algebraic extension over $K$ contained
in $\overline{K}$. Then the following are equivalent:
\begin{enumerate}
\item Any $K$-embedding $\sigma: N \to \overline{K}$ induces an
$K$-automorphism of $N$.

\item $N$ is a splitting field of some $S \subset K[x]$ over $K$.

\item Every irreducible polynomial in $K[x]$ having a root in $N$
splits in $N$.
\end{enumerate}
\end{prop}

\begin{proof}
For $(1) \Rightarrow (2),(3)$, we prove that for every $u \in N$,
with minimal polynomial $p(x)$, then $ v \in N$ for every root of
$p(x)$. To this end, start with an isomorphism $\sigma:K(u) \to
K(v)$. By extension theorem, one can extend it to an embedding $N
\to \overline {K(v)}=\overline{K}$. The embedding is an
automorphism by $(1)$. Thus, $v=\sigma(u) \in N$.

$(3) \Rightarrow (2)$ is trivial.

For $(2) \Rightarrow (1)$. Suppose that $N$ is a splitting field
of $S$ over $K$. Let $u$ be a root of $f(x) \in S$. Let $\sigma: N
\to \overline{K}$ be any $K$-embedding. It's clear that
$\sigma(u)$ is a root of $f(x)$, hence $\sigma(u) \in N$. Thus
$\sigma(N) \subset N$. Since $\sigma$ is injective and $N/K$ is
algebraic, $\sigma$ is in fact an isomorphism.
\end{proof}

The property of being normal is not as well-behaved as begin
algebraic or finite. For example, it's not preserve after
"extension"

\begin{ex}
If $F/E$ and $E/K$ are normal, then $F/K$ is not necessarily
normal. For example, take $F=\Q(\sqrt[4]{2}),
E=\bQ(\sqrt{2}),K=\bQ$. It's easy to see that a degree $2$
extension is always normal, however, $\bQ(\sqrt[4]{2})$ is not
normal over $\bQ$.

Also let's consider $K \subset E \subset F$. Then $F$ is normal
over $K$ implies that $F$ is normal over $E$. But it doesn't imply
that $E$ is normal over $K$. For example, take $F=\bQ(\sqrt[4]{2},
i ), E=\bQ(\sqrt[4]{2}), K = \bQ$
\end{ex}

Being normal is preserved by "lifting" and "compositum"
\begin{prop} Let $E, F$ be extensions over $K$ and contained in a
field $L$.  If $E/K$ is normal then $EF/F$ is normal. Moreover, if
both $E/K,F/K$ are normal, then $EF/K$ is normal.
\end{prop}

\begin{proof}
In order to show that $EF$ is normal over $F$, we look at
$F$-embedding $\sigma : EF \to \overline{F}$. Since $\sigma$ is
identity on $F$, hence on $K$. By the extension theorem and the
proof of the previous Proposition, one can show that $\sigma_{|E}$
is an automorphism. Hence $\sigma(E)=E$. It follows that
$$\sigma(EF)=\sigma(E) F = EF.$$ Thus $EF$ is normal over $F$.

Suppose now that $E/K,F/K$ are normal. Let $\sigma: EF \to
\overline{K}$ be a $K$-embedding. We have that $\sigma_{|E},
\sigma_{|F}$ are $K$-embeddings. One sees that $\sigma(E)=E$ and
$\sigma(F)=F$ by the normal assumption. If follows that
$$ \sigma(EF)=\sigma(E) \sigma(F) = E F.$$

\end{proof}


\subsection{finite dimensional Galois extension}
In this section, we are going to prove the fundamental theorem for
finite dimensional Galois extension.

Let $F/K$ be an field extension, we define the Galois group of $F$
over $K$, denoted ${\rm Gal}_{F/K}$ or $G_{F/K}$ or ${\rm Aut}_K
(F)$, as
$$\gal_{ F/ K}:=\{\sigma| \sigma \in \Aut F, \sigma_{|K}={\bf 1}_K\}.$$

It's clear that for  $\sigma \in \gal_{F/K}$ and $u\in F$
algebraic over $K$ with minimal polynomial $p(x)$, then
$\sigma(u)$ satisfies the same minimal polynomial.

On the other hand, if $F/K$ is normal, let $u,v$ be two elements
having the same minimal polynomial $p(x)$, then we claim that
there is an $\sigma \in \gal_{F/K}$ such that $\sigma(u)=v$. To
see this, we fix an algebraic closure $\overline{K}$ containing
$F$. There is an  $K$-isomorphism $\sigma_0: K(u) \to K(v)$ which
extends to an embedding $\sigma: F \to \overline{K}$ . Since $F$
is normal over $K$, one has $\sigma(F) \subset F$. And hence
$\sigma \in \Aut F$.

\begin{ex} \label{x3-2} \end{ex}
Consider the field $F:=\bQ(\sqrt[3]{2}, \omega)$ which is a
splitting field of $x^3-2$ over $\bQ$. Thus it's normal over
$\bQ$. One can check that the Galois group $\gal_{F/\bQ}$ is
generated by $\sigma, \tau$ that $\sigma(\sqrt[3]{2})=\sqrt[3]{2}
\omega, \sigma(\omega)=\omega$, and
$\tau(\sqrt[3]{2})=\sqrt[3]{2}, \tau( \omega)=\omega^2$. It's easy
to check that $\gal_{F/\bQ} \cong S_3$. \qed

\begin{ex} \label{x3-2ngal}\end{ex}
Consider the field $F:=\bQ(\sqrt[3]{2})$ over $\bQ$. Then it's
easy to check that $\gal_{F/\bQ} = \{ \id_F\}$. \qed

There is a natural correspondence between subgroups of Galois
groups and intermediate fields. To be precise, fix an extension
$F/K$. Let $H < G:=\gal_{F/K}$ be a subgroup. One can define
$$ H':=\{ u \in F| \sigma(u)=u, \forall \sigma \in H\}.$$
It's clear that this is a field. On the other hand, given and
intermediate field $L$ such that $K \subset L \subset F$, then one
can define
$$ L':= \{ \sigma \in \gal_{F/K} | \sigma(u)=u, \forall u \in
L\}=\{ \sigma \in \gal_{F/K}| \sigma_{|L}=\id_L\}.$$

It's easy to check the following properties:
\begin{prop} Let $F/K$ be an extension with Galois group $G$.
Let $L$ be an intermediate field, i.e. $K \subset L \subset F$,
and $H <G$ is a subgroup.
\begin{enumerate}
\item $F'=\{\id_F\}$, $K'=G$, and $\{\id_F\}'=F$.

\item For any $L$, one has $L \subset L''$, $L'=L'''$.

\item For any $H$, one has $H < H''$, $H' = H'''$.

\item For any intermediate fields $L \subset M$, one has $M' <
L'$.

\item For any subgroups $J <H$, one has $H' \subset J'$.
\end{enumerate}
\end{prop}

\begin{proof}
Most of the proof follows directly from the definition. We only
sketch the proof for $L'=L'''$.

By $L \subset L''$ and $(4)$, one has
$$ (L'')^{'} < L'.$$
On the other hand, by $(5)$, one has
$$ L' < (L')^{''}.$$
We are done.
\end{proof}

\begin{prop}
There is a one-to-one correspondence between
$$\{L| K \subset L \subset F, L''=L\} \leftrightarrow \{ H | H <
G, H''=H\}.$$
\end{prop}

\begin{proof}
The correspondence is given by $L \mapsto L'$ (or $H \mapsto H'$).

To show the injective, one sees that if $L_1'=L_2'$, then
$L_1=L_1''=L_2''=L_2$.

For any $H$ with $H''=H$, we  take $L=H'$, then  $H=L'$. It
suffices to check that $L''=L$. This follows from the fact that
$H'''=H'$.
\end{proof}

In the proposition, one might expect that $G'=K$. However, this is
not always the case (see e.g. Example \ref{x3-2ngal}). For
extension with this property, we call it {\it Galois}. It turns
out that this naive definition is a very delicate one which leads
to some nice properties.

\begin{defn}
An extension $F/K$ is said to be Galois if $(\gal_{F/K})'=K$.
\end{defn}

\begin{ex} \end{ex} Keep the notation as in Example \ref{x3-2}.
One can check that $G'=\bQ$, hence a Galois extension.

In fact the group $G$ has the following subgroups: $\{ \id\},
<\tau>, <\tau \sigma>, <\tau \sigma^2>, <\sigma>, G$ of order
$1,2,2,2,3,6$ respectively. Their fixed fields are
$\bQ(\sqrt[3]{2}, \omega),\bQ(\sqrt[3]{2}), \bQ(\sqrt[3]{2}\omega)
,\bQ(\sqrt[3]{2}\omega^2), \bQ(\omega), \bQ$ respectively.

Conversely, for these intermediate subfields, their fixed groups
are exactly those corresponding ones. \qed

In general, we have the following:

\begin{thm}[Fundamental theorem of finite dimensional Galois
extension] Let $F/K$ be a finite dimensional Galois extension with
Galois group $G$, then
\begin{enumerate}
\item There is an one-to-one correspondence between $$\{ L| K
\subset L \subset F \} \leftrightarrow \{ H | H < G\}.$$

\item The corresponding degree are equal. That is, if $K \subset L
\subset M \subset F$, then $[M:L]=[L':M']$. And if $J < H <G$,
then $[H:J]=[J':H']$.

\item An intermediate field $E$ is Galois over $K$ if and only if
$E' \lhd G$. And in this case, $\gal_{E/K} \cong G/E'$.
\end{enumerate}
\end{thm}

\begin{proof}

{\bf Step 1.} $[M:L] \ge [L':M']$.\\
We prove the case that $M=L(u)$ for some $u \in M$ and by
induction on $[M:L]$, we are done. Suppose now that $M=L(u)$ and
let $p(x)$ be the minimal polynomial of $u$ over $L$. Let $S$ be
the set of roots of $p(x)$ in $F$. Then one has a map $$\Phi: L'
\to S,$$
$$ \sigma \mapsto \sigma(u).$$
One can check that $\Phi$ induces an injective map $L'/M' \to S$.
Hence one has
$$ [L':M']=|L'/M'| \le |S| \le deg(p(x)) = [M:L].$$

 {\bf Step 2.} $[H:J] \ge [J':H']$.\\
 Let $n=[H:J]$. Suppose on the contrary that there are  $n+1$ elements
 $u_1,...,u_{n+1} \in J'$ linearly independent over $H'$.

We consider the equation $\sum_{i=1}^{n+1} u_i x_i=0$ in $F$
 Consider now a set of representative of $H/J$, denoted
 $\{e=\sigma_1,...,\sigma_n\}$. By applying $\sigma_i$ to the above equation.
 Then one has a system of linear
 equations in $F$.
 $$(*) \left\{ \begin{array}{l}
\sigma_1(u_1)x_1+ \sigma_1 (u_2)x_2+...+
\sigma_1(u_{n+1}) x_{n+1}=0 \\
\sigma_2(u_1)x_1+ \sigma_2 (u_2)x_2+...+
\sigma_2(u_{n+1}) x_{n+1}=0 \\
\vdots\\
  \sigma_n(u_1)x_1+ \sigma_n (u_2)x_2+...+
\sigma_n(u_{n+1}) x_{n+1}=0 \\
 \end{array} \right.
$$


Pick a solution in $F$ with smallest number of non-zero $a_i$'s,
may assume it's $(a_1,...,a_s,0...,0)$ and $a_1=1$.

If there is an $\tau \in H$ such that $\tau(a_2) \ne a_2$, then by
applying $\tau$ to the system $(*)$, one get the same system of
equations with a solution
$(\tau(a_1),\tau(a_2),...,\tau(a_s),0,...,0$ . Hence
$$(a_1,...,a_s,0...,0)-(\tau(a_1),\tau(a_2),...,\tau(a_s),0,...,0)=(0,a_2-\tau(a_2),...,0)$$
is a non-zero solution of smaller length. This is the required
contradiction.

To find $\tau$. We look at $u_1 a_1+...+u_s a_s=0$. Since
$\{u_1,...,u_s\}$ is independent over $H'$, not all $a_1$ is in
$H'$. We may assume that $a_2 \not \in H'$. Hence there is a $\tau
\in H$ such that $\tau (a_2) \ne a_2$. We are done.

 {\bf Step 3.} We show that every intermediate field $L$,
$L''=L$. And every subgroup $H<G$, $H''=H$.

By Step 1, one has $$[L'':K]=[L'':K''] \le [K':L'] \le [L:K],$$
however, one has $L \subset L''$. Thus one has $L=L''$. Similarly,
one can prove that $H''=H$ by considering $[H'':\{\id_F\}]$.

{\bf Step 4.} $[M:L]=[L':M']$ and $[H:J]=[J':H']$.

This follows from $[M:L]=[M:K]/[L:K]=[K':M']/[K':L']=[L':M']$. And
the other one is similar.

{\bf Step 5.} $F/K$ is normal and separable.

Given $u \in F$, with minimal polynomial $p(x)$ over $K$. As in
the proof of Step 1. One has $ [K(u)':K'] \le |S| \le deg(p(x)) =
[K(u):K]$. By Step 4, they are equalities. In particular, every
root of $p(x)$ is in $F$ and there is no multiple roots. Thus $F$
is normal and separable over $K$.


{\bf Step 6.} If $N \lhd G$, then $N'$ is stable. That is, for all
$\sigma \in G$, $\sigma(N') \subset N'$ (indeed $=N'$).

Since $N \lhd G$, for all $\sigma \in G$ and for all $\tau \in N$,
one has $\sigma^{-1} \tau \sigma \in N$. Thus, $\sigma^{-1} \tau
\sigma (N') =N'$. It follows that $\tau \sigma (N') = \sigma(N')$,
for all $\tau \in N$. Hence $\sigma(N')$ is fixed by all $N$ and
thus $\sigma(N') \subset N'$.

{\bf Step 7.} If $E$ is a stable intermediate subfield. Then the
restriction map $\gal_{F/K} \to \gal_{E/K}$ is well-defined  and
surjective.

Since $E$ is stable, then $\sigma_{|E} \in \gal_{E/K}$ for any
$\sigma \in \gal_{F/K}$. Moreover, let $\tau \in \gal_{E/K}$, by
the extension theorem, there is an extension $\overline{\tau}: F
\to \overline{K}$. Since $F$ is normal over $K$, $\overline{\tau}$
is in fact an automorphism of $F$.

{\bf Step 8.} If an intermediate field $E$ is stable, then $E/K$
is Galois.

To see this, it suffices to show that for any $u \in E -K$, there
is an $\sigma \in \gal_{E/K}$ such that $\sigma(u) \ne u$. Fix any
$F \ni v \ne u$ with the same minimal polynomial as $u$. There is
an $K$-isomorphism $\sigma_0: K(u) \to K(v)$ such that
$\sigma(u)=v$. $\sigma$ can be extended to an embedding
$\overline{\sigma}: F \to \overline{K}$, which gives an
automorphism of $F$. The restriction
$\sigma=\overline{\sigma}_{|E}$ gives an automorphism of $E$ that
$\sigma(u) \ne u$.

{\bf Step 9.} If $E/K$ is Galois, then $E$ is stable.

One first notices that  $E/K$ is normal. For  every $\sigma \in
\gal_{F/K}$, $\sigma$ gives an embedding $\sigma_{|E}:E \to
\overline{K}$. Since $E/K$ is normal, $\sigma_{|E}$ is an
automorphism of $E$. And hence $E$ is stable under the Galois
group $\gal_{F/K}$ action.

{\bf Step 10.} If $E$ is stable, then $E'$ is normal.

This can be checked directly. For all $\sigma \in G$ and $\tau \in
E'$ and for all $u \in E$, $$\sigma^{-1} \tau \sigma (u)=
\sigma^{-1} \tau ( \sigma (u)) =\sigma^{-1} \sigma (u) =u,$$ since
$\sigma(u) \in E$. Therefore, $\sigma^{-1} \tau \sigma \in E'$.
\end{proof}

\vfill \pagebreak
\begin{center}
Dec. 1, 2006
\end{center}

\begin{rem}
Some of the result we proved still true in a more general setting.
We list some here:
\begin{enumerate}
\item If $F/K$ is an extension, and an intermediate field $E$ is
stable, then $E' \lhd \gal_{F/K}$.

\item Let $F/K$ be an extension. If $N \lhd \gal_{F/K}$, then $H'$
is stable.

\item If $F/K$ is Galois, and $E$ is a stable intermediate field,
then $E$ is Galois over $K$. (finite-dimensional assumption is
unnecessary here)

\item An intermediate field $E$ is algebraic and Galois over $K$,
then $E$ is stable.
\end{enumerate}
\end{rem}

We conclude this section with the following theorem concerning the
relation between Galois extension, normal extension and splitting
fields.

\begin{defn}
An irreducible polynomial $f(x) \in K[x]$ is said to be {\bf
separable} if its roots are all distinct in $\overline{K}$.

Let $F$ be an extension over $K$ and $u \in F$ is algebraic over
$K$. Then $u$ is separable over $K$ if its minimal polynomial is
separable.

An extesnion $F$ over $K$ is separable if every  element of $F$ is
separable over $K$.
\end{defn}
\begin{thm}
Let $F/K$ be an extension, then the following are equivalent
\begin{enumerate}
\item $F$ is algebraic and Galois over $K$.

\item $F$ is separable over $K$ and $F$ is a splitting field over
$K$ of a set $S$ of polynomials.

\item $F$ is a splitting field of separable polynomials in $K[X]$.

\item $F/K$ is normal and separable.
\end{enumerate}
\end{thm}
\begin{proof}
Fix $u \in F$ with minimal polynomail $p(x)$ over $K$. Let
$\{u=u_1,...,u_r\}$ be distinct roots of $p(x)$ in $F$. For any
$\sigma$, then $\sigma$ permutes $\{u=u_1,...,u_r\}$. Thus
$f(x):=\prod_{i=1}^{r} (x-u_i)$ is invariant under $\sigma$. Hence
$f(x) \in K[x]$. It follows that $f(x)=p(x)$. This proved that
$(1)\Rightarrow (2),(3),(4)$.

One notices that $(2)\Leftrightarrow (4)$. Thus it remains to show
that $(2)\Rightarrow (3)$, and $(3)\Rightarrow (1)$.

For $(2)\Rightarrow (3)$, let $f(x) \in S$ and let $g(x)$ be an
monic irreducible component of $f(x)$. Since $f(x)$ splits in $F$,
it's clear that $g(x)$ is an minimal polynomial of some element in
$F$. Moreover, since $F/K$ is separable, $g(x)$ is separable. One
sees that $F$ is in fact a splitting field of such $g(x)$'s.

For $(3)\Rightarrow (1)$, we first note that $F/K$ is algebraic
since $F$ is a splitting field. We shall prove that $(4)
\Rightarrow (1)$. The implication $(3) \rightarrow (4)$ follows
from a general fact about separable extension that an algebraic
extension $F/K$ is separable if $F$ is generated by separable
elements.

To this end, pick any $u \in F-K$, with minimal polynomial $p(x)$
of degree $\ge 2$ and separable. Hence there is a different root,
say $v$, of $p(x)$ in $F$. It's natural to consider the
$K$-isomorphism $\sigma: K(u) \to K(v)$. Which can be extended to
$\bar{\sigma}:F \to \overline{K}$. Since $F$ is normal,
$\bar{\sigma}$ is an automorphism of $F$, hence in $\gal_{F/K}$
sending $u$ to $v \ne u$. So $F/K$ is Galois.

\end{proof}

\subsection{Galois group of a polynomial}
In this section, we are going to study Galois group of a polynomial.
We will define this notion in general and study polynomial of degree 3,4 in more detail.

\begin{defn}
Let $f \in K[x]$ be a polynomial with splitting field $F$. The Galois group of $f(x)$,
denoted $G_f$ is the Galois group of $F/K$.
\end{defn}

The Galois group of a polynomial have some basic properties.
\begin{prop}
Let $f(x)$ be a polynomial of degree $n$, then $G_f \hookrightarrow S_n$.
Thus one can viewed $G_f$ as a subgroup of $S_n$.

If $f(x)$ is irreducible and separable, then $G_f$ is transitive and $|G_f|$ is divided by $n$.
\end{prop}

\begin{proof}[Sketch of the proof]
Let $\{u_1,...,u_r\}$ be roots of $f(x)$ in $F$. For $\sigma \in
G_f$, $\sigma(u_i)=u_j$. Hence $\sigma$ gives a permutation of $r$
elements. It follows that $G_f$ can be viewed as a subgroup of
$S_r$ hence $S_n$.

($r $ could possibly less than $n$ because there might have multiple roots in general).

Now if $f(x)$ is  separable. Then we have distinct roots
$\{u_1,...,u_n\}$ in $F$. For any $u_i$, we have $K[u_i] \cong
K[x]/(f(x))$ since $f(x)$ is irreducible. If follows that there is
a $K$-isomorphism $\sigma: K[u_i] \to K[x]/(f(x)) \to K[u_j]$ for
all $i ,j$. $sigma$ gives an $K$-embedding $K[u_i] \to
\overline{K[u_j]}=\overline{K}$ and extended to a $K$-embedding $
\bar{\sigma} :F \to \overline{K}$. Since $F$ is normal,
$\bar{\sigma} (F) = F$ (cf. Theorem ?). Thus $\bar{\sigma} \in
G_f$ and $\bar{\sigma}(u_i) = \sigma(u_i)=u_j$. Therefore, $G_f$
is transitive.

Moreover, since $K \subset K[u_i] \subset F$. So $|G_f|=[F:K] = [F:K[u_i]] n$ is divided by $n$.
\end{proof}

So now, we discuss irreducible separable polynomials of small degree.
One might wondering how do we know a polynomial is separable or not. We have the following easy criteria:

\begin{prop} Let $f(x) \in K[x]$ be an irreducible polynomial
The following are equivalent:\\
$1$. $f(x)$ is separable. \\
$2$. $(f(x),f'(x))=1$ in $ \overline{K}[x]$\\
$3$. $(f(x),f'(x))=1$ in ${K}[x]$\\
$4$. $f'(x) \ne 0$

Recall that when $f(x)=\sum a_ix^i$, then $f'(x)$ is its formal
differentiation which is $f'(x):= \sum i a_i x^{i-1}$.
\end{prop}

\begin{proof}
If $f(x)$ is separable, then $f(x)= \prod_{i=1}^n (x-u_i)$ with
distinct $u_i$ in $\overline{K}[x]$. Thus $f'(x) =\sum
\frac{\prod_{i=1}^n (x-u_i)}{x-u_i}$. If $(f(x),f'(x)) \ne 1$ in
$\overline{K}[x]$, then $x-u_i | f'(x)$ for some $i$. However,
$f'(u_i) = \prod_{j \ne i} (u_j-u_i) \ne 0$, a contradiction.

Conversely, if $f(x)$ is not separable, then $ f(x)= \prod_{i=1}^r
(x-u_i)^{a_i}$ with some $a_i \ge 2$. Let's say $a_1 \ge 2$. Then
it's clear that $(x-u_1)$ is a factor of $f'(x)$ as well. Hence
$(f(x),f'(x)) \ne 1$. This proved the equivalence of $(1)$ and
$(2)$.

To see the equivalence of $(2)$ and $(3)$. Note that if
$(f(x),f'(x))=1$ in ${K}[x]$, then $1= f(x)s(x) + f'(x)t(x)$ for
some $s(x),t(x) \in K[x]$. One can view this in $\overline{K}[x]$
and thus conclude that $ (f(x),f'(x))=1$ in $\overline{K}[x]$. On
the other hand, if $(f(x),f'(x))=d(x) \ne 1$ in ${K}[x]$, then
$d(x)= f(x)s(x) + f'(x)t(x)$ for some $s(x),t(x) \in K[x]$. One
can view this in $\overline{K}[x]$ and thus conclude that $ d(x)|
(f(x),f'(x))$ in $\overline{K}[x]$. In particular, $(f(x),f'(x))
\ne 1$ in $\overline{K}[x]$

Now finally, since $f(x)$ is irreducible, $(f(x),f'(x))$ could
only be $1$ or $f(x)$. Since $f(x)|f'(x)$ if and only $f'(x)=0$.
Thus we are done.
\end{proof}

One notice that if $\chr K  \ne 0$, then an irreducible polynomial
is always separable. When $\chr K =p$, then an irreducible
polynomial $f(x)$ is not separable if and only $f(x)=g(x^p)$ for
some $g(x)$.

One can go a little bit further. If $K$ is finite field with $\chr
K =p$. Let $f(x)=\sum a_i x^i$ be an irreducible polynomial.
$f'(x)=0$ means that $p | i $ for all $a_i \ne 0$. Thus $f(x)$ can
be rewrite as $\sum a_i x^{ip}$. Recall that each $a_i$ can be
written as $b_i^p$ for some $b_i$ because $K$ is finite. Thus
$f(x) = \sum b_i^p x^{ip} = (\sum b_i x^i )^p$. This contradicts
to $f(x)$ being irreducible. To sum up, an irreducible polynomial
over a finite field is always separable.

Let's now turn back to the discussion of Galois groups. If $f(x)$
is irreducible and separable of degree $2$, then $G_f \cong S_2
\cong \bZ_2$. If $f(x)$ is irreducible and separable of degree
$3$, then  $G_f$ is a subgroup of $S_3$ of order divided by $3$.
Thus $G_f$ could be $A_3$ or $S_3$. The question now is how to
distinguish these two cases.

\begin{lem} $(\chr K \ne 2)$
Let $f(x) \in K[x]$ be an irreducible and separable polynomial of degree $3$
with splitting field $F$ and roots $u_1,u_2,u_3$. Then $(G_f \cap A_3)¡¦ = K[\Delta]$,
where $\Delta:= (u_1-u_2)(u_1-u_3)(u_2-u_3)$
 \end{lem}

Note that $f(x)$ is irreducible and separable, then $F/K$ is
Galois. And $\Delta^2$ is invariant under $G_f$. Thus $D:=
\Delta^2 \in K$. We call $D$ the discriminant of $f(x)$.

If $f(x)$ is written as $x^3+bx^2+cx+d$, then
$s_1:=u_1+u_2+u_3=-b$, $s_2:=u_1u_2+u_1u_3+u_2u_3=c$,
$s_3:=u_1u_2u_3= -d$. We impose an ordering $u_1 > u_2 > u_3$.
Then leading term of $D$ is $u_1^4u_2^2$, which is the leading
term of $s_1^2 s_2^2$. Then we consider $D':=D-s_1^2 s_2^2$ with
lower leading term, which is $-4 u_1^3u_2^3$. This leading term is
the same as the leading term of $-4 s_2^3$. So we consider
$D^{(2)}:=D'+4 s_2^3$. Inductively, one can write $D$ in terms of
$s_1,s_2,s_3$, hence in terms of $b,c,d$.

If $f(x)$ is normalized as $x^3+px+q$, then $D=-4p^3-27q^2$.

\begin{proof}
 $\sigma (\Delta)= \Delta$ if and only $\sigma$ is an even
permutation. So  $\Delta \in (G_f \cap A_3)'$ clearly. Hence we
have $ K[\Delta] <(G_f \cap A_3)'$. Thus $ K[\Delta]' >(G_f \cap
A_3)$. If $\sigma \in K[\Delta]'$,  then $\sigma(\Delta)=\Delta$,
hence $\sigma$ is even. Thus $ K[\Delta]'< (G_f \cap A_3)$. So we
have $ K[\Delta]'= (G_f \cap A_3)$ and $ K[\Delta]=(G_f \cap
A_3)'$.
\end{proof}

We thus conclude that $G_f =A_3$ if and only if $D_f$ is square in $K$.
And  $G_f =S_3$ if and only if $D_f$ is not a square in $K$

\begin{ex} \end{ex}Let $f(x)=x^3+x+1 \in \bQ[x]$. It's
irreducible.


Now we consider the case of degree $4$ polynomial. One can also define $\Delta$ and discriminant $D$ similarly.
However, it turns out that this is not enough to classify all cases.
The idea is to consider another normal subgroup $V_4 \lhd S_4$.

Let's first list at all possible subgroup in $S_4$. Since $G_f$ is
transitive with order divided by $4$. We can have following
$$ \begin{array}{cccc}
|G_f| & G_f & G_f \cap V_4 & |G_f|/|G_f \cap V_4| \\
\hline
24 & S_4 & V_4 & 6 \\
12 & A_4 & V_4 & 3 \\
8 & \cong D_8 & V_4 & 2 \\
4 & \cong \bZ_4 & \ne V_4 & 2 \\
4 & V_4 & V_4 & 1 \\
\end{array}
$$
Also we have the following
\begin{lem}
Let $f(x)$ be an irreducible separable polynomial of degree $4$ with splitting field $F$ and roots $u_1,¡K,u_4$.
Let $\alpha=u_1u_2+u_3u_4$ $\beta= u_1u_3+u_2u_4$, $\gamma=u_1u_4+u_2u_3$.
Then $K[\alpha,\beta,\gamma] = (G_f \cap V_4)¡¦$.
\end{lem}

Let $g(x)=(x-\alpha)(x-\beta)(x-\gamma)$, then one can check that
$\sigma(g(x)= g(x)$ for all $\sigma \in G_f$. Thus $g(x) \in K[x]$
for $F/K$ is Galois. The cubic $g(x)$ is call the {\bf resolvant
cubic} of $f(x)$. If $f(x)= x^4+bx^3+cx^2+dx+e$, then its
resolvant cubic is $g(x)= x^3-c x^2+ (bd-4e)x-b^2e+4ce-d^2$ by
computation on symmetric polynomials as we exhibited.

\begin{proof}
It clear that $ K[\alpha,\beta,\gamma] < (G_f \cap V_4)'$. Hence
we have $(G_f \cap V_4) < K[\alpha,\beta,\gamma]'$. Now if $\sigma
\in K[\alpha,\beta,\gamma]'$ and $\sigma \ni V_4$. We claim that
this would lead to a contradiction. And thus we are done.

The claim can be verified directly by exhausting all cases.
For example, if $\sigma = (1,3)$, then
$\sigma (\alpha)=\alpha$ gives $u_3u_2+u_1u_4= u_1u_2+u_3u_4$.
Thus $(u_2-u_4)(u_1-u_3)=0$ contradict to reparability of $f(x)$. The other cases can be computed similarly.

\end{proof}

Let $m:=|G_f|/|G_f \cap V_4| = [K[\alpha,\beta,\gamma] : K ] $.
By using this correspondence, one sees that:\\
1. $m=1 \Leftrightarrow G_f = V_4  \Leftrightarrow $ $g(x)$ splits into linear factors in $K[x]$. \\
2. $m=3 \Leftrightarrow G_f = A_4  \Leftrightarrow $ $g(x)$ is irreducible in $K[x]$ and $D_g$ is a square in $K$.\\
3. $m=6 \Leftrightarrow G_f = S_4  \Leftrightarrow $ $g(x)$ is
irreducible in $K[x]$ and $D_g$ is not a square in $K$.

The only remaining unclear case is $m=2$. This case corresponding to the case
that $g(x)$ splits into a linear and a quadratic factors in $K[x]$.
To see the Galois group, we claim that $G_f \cong D_8$ if and only if
$f(x)$ is irreducible in $K[\alpha,\beta,\gamma][x]$.

First of all, if $f(x)$ is irreducible in $K[\alpha,\beta,\gamma][x]$, then
$$ 4 = [ K[\alpha,\beta,\gamma] [u_1] : K[\alpha,\beta,\gamma] ]
\le [F : K[\alpha,\beta,\gamma] ] =|G_f \cap V_4|.$$ So $G_f \cong D_8$.

On the other hand, $F$ is the splitting field of $f(x)$ over $
K[\alpha,\beta,\gamma]$ as well. Suppose that $f(x)$ is reducible.
If $f(x)$ factors into a linear  and a cubic factor in $
K[\alpha,\beta,\gamma]$, then the Galois group of $f(x)$ over $
K[\alpha,\beta,\gamma]$, which is $G_f \cap V_4$, can only $\cong
A_3$ or $S_3$. This is a contradiction. Running over all cases,
one sees that the only possible case is $f(x)$ factors into two
linear and one quadratic factors. Thus $ |G_f \cap V_4 |=2$ and
hence $G_f \cong \bZ_4$.


\vfill \pagebreak
\begin{center}
Dec. 8, 2006
\end{center}


\subsection{finite fields}
The Galois theory on finite fields is comparatively easy and
basically governed by Frobenius map.

Recall that given a finite field $F$ of $q$ elements, it's prime
field must be of the form $\bF_p$ for some prime $p$. Let $n=[F:
\bF_p]$, then $|F|=p^n$.

\begin{thm}
$F$ is a finite field with $p^n$ elements if and only if $F$ is a
splitting field of $x^{p^n}-x$ over $\bF_p$.
\end{thm}

\begin{proof}[Sketch.] Recall that $F^*$ is a multiplicative group of order
$p^n-1$. Hence it's easy to see that every element $u \in F$
satisfying $x^{p^n}-x$. Thus element of $F$ are exactly roots of
$x^{p^n}-x$, therefore, $F$ is a splitting field of $x^{p^n}-x$
over $\bF_p$.

Conversely, if $F$ is a splitting field of $x^{p^n}-x$ over
$\bF_p$. Let $E \subset F$ be the subset of all roots of
$x^{p^n}-x$. One can check that $E$ is a subfield (containing
$\bF_p$ and all roots). By definition of splitting field, $E$ is a
splitting field, and $E=F$. So $|F|=|E| \le p^n$. However, notice
that $x^{p^n}-x$ is separable. So $|F|=p^n$.
\end{proof}

\begin{prop}
Let $F$ be a finite field and $F/K$ is an extension. Then $F/K$ is
Galois. The Galois group is cyclic, generated by Frobenius map.
\end{prop}

\begin{proof}
We shall prove the case that $K=\bF_p$. For general $K$, $\bF_p
\subset K \subset F$. Since $F/ \bF_p$ is Galois, then $F/K$ is
also Galois with Galois group $K' < \gal_{\bF_p}F$ also a cyclic
group.

Now we consider $F/ \bF_p$, and $|F|=p^n$. Since $F$ is a
splitting field of a separable polynomial $x^{p^n}-x$ over
$\bF_p$, $F$ is Galois over $\bF_p$.

The Galois group $\gal_{\bF_p}F$ has order $[F:\bF_p]=n$. Consider
the Frobenius map $\varphi: a \to a^p$, which is clearly a
$\bF_p$-automorphism. So $\varphi \in \gal_{\bF_p} F$. Note that
order of $\varphi$ is $n$. So $\gal_{\bF_p} F$ can only be the
cyclic group generated by $\varphi$.
\end{proof}

\subsection{cyclotomic extension}

We now start the study of cyclotomic extension.
\begin{defn}
A cyclotomic extension of order $n$ over $K$ is a splitting field
of $x^n-1$.
\end{defn}

\begin{rem}
If $char(K)=p$ and $n=p^rm$, then $x^n-1=(x^m-1)^{p^r}$. Hence we
may assume that either $char(K)=0$ or $char(K)=p \nmid n$ in the
study of cyclotomic extension.
\end{rem}

The main theorem is the following:
\begin{thm}
Keep the notation as above. Then we have
\begin{enumerate}
\item $F=K(\zeta)$, where $\zeta$ is a primitive $n$-th root of
unity.

\item $F/K$ is Galois whose Galois group $\gal_{F/K}$ can be
identified as a subgroup of $\ZZ_n^*$.

\item If $n$ is prime, then $\gal_{F/K}$ is cyclic. More general,
is $n=p^k$ with $p \ne 2$, then then $\gal_{F/K}$ is cyclic.
\end{enumerate}
\end{thm}

\begin{proof}
Let $S:=\{u \in F| u^n=1\}$. And let $n'$ be the maximal order of
elements in $S$. Clearly, $n' \le n$  It's clear that $S$ is an
abelian multiplicative group. Therefore, it's easy to see that
order of elements in $S$ divides $n'$. It follows that $u^{n'}=1$
for all $u \in S$. Hence $|S| \le n'$.

Since we assume that $(n, \chr(K))=1$, therefore $x^n-1$ is
separable. It follows that  roots of $x^n-1$ are all distinct,
hence $|S|=n$. One sees that $n=n'$, therefore, there are elements
of order $n$ in $S$, denoted $\zeta$. It follows that
$F=K(S)=K(\zeta)$.

For any $\sigma \in \gal_{F/K}$, $\sigma(\zeta) \in S$. Hence
$\sigma(\zeta)=\zeta^i$ for some $i$. Therefore, we have a natural
map $\phi: \gal_{F/K} \to \ZZ_n$ by $\phi(\sigma)=i$ if
$\sigma(\zeta)=\zeta^i$. Note that if $\zeta^i$ is not a primitive
$n$-th root of unity, then $K(\zeta^i) $ is not the splitting
field of $x^n-1$, hence not equal to $K(\zeta)$, which is absurd.
Thus sigma we conclude that $\zeta^i$ is a primitive $n$-th root
of unity.   It's easy to see that this is equivalent to $(i,n)=1$.
Thus  $\phi: \gal_{F/K} \to \ZZ_n^*$ is an injective group
homomorphism.

Lastly, if $n=p^k$ with $p \ne 2$ or if $n=2,4$, then $\ZZ_n^*$ is
cyclic. Hence every subgroup is cyclic.
\end{proof}

The structure of cyclotomic extension is thus determined by the
primitive $n$-th root of unity. It's then natural to ask the
degree of such extension and their minimal polynomials.

\begin{defn}
If $\chr K \nmid n$, then the $n$-th {\bf cyclotomic polynomial}
over $K$ is defined as:
$$g_n(x):= \prod_{\zeta_i: \text{ prim. $n$-th root of 1}}
(x-\zeta_i).$$
\end{defn}

\begin{prop}
We have the following:\\
\noindent $1$. $x^n-1 = \prod_{d|n} g_d(x)$.\\
\noindent $2$. $g_n(X) \in P[x]$, where $P$ denoted the prime
field. Moreover, if $\chr K=0$, we identify $P= \bQ$, then $g_n(x)
\in
\bZ[x]$.\\
 \noindent $3$. $deg( g_n(x))= \varphi(n)$, where $\varphi$ denotes
 the Euler $\phi$-function.
\end{prop}

\begin{proof}
$(3)$ is clear from the definition.

For $(1)$, we consider the following decomposition of sets $$ \{
\zeta^i\}_{i=0,...,n-1} = \cup_{d|n} \{ \zeta^i| o(\zeta^i)=d\}.$$
Note that $ o(\zeta^i)=d$ implies that $\zeta^i$ is a primitive
$d$-th root of unity. Thus we define $g'_d(x):=
\prod_{o(\zeta^i)=d} (x-\zeta^i)$,  and  then  $g'_d(x)  |
g_d(x).$ By the decomposition, we have
$$ x^n-1= \prod_{i=0,...,n-1} (x- \zeta^i) = \prod_{d|n}
g'_d(x).$$ Computing degrees, we have $$ n = \sum_{d|n} deg(
g'_d(x)) \le \sum_{d|n} deg(g_d(x)) = \sum_{d|n} \varphi(d) =n.$$
Therefore, $g'_d(x)=g_d(x)$.

To see $(2)$, we prove by induction on $n$. We assume that $g_d(x)
\in P[x]$ for all $d < n$. We can write $x^n-1 = g_n(x) f(x) \in
F[x]$. In $P[x]$, we have $x^n-1 = f(x)q(x) +r(x)$ by the division
algorithm. We shall prove that $r(x)=0$ and thus $g_n(x)=q(x) \in
P[x]$ by the unique factorization of $F[x]$.

It suffices to show that $r(x)=0$. To this end, note that $f(x) |
x^n-1$  in $F[x]$, and thus $f(x) | r(x)$ in $F[x]$. However,
$deg(r(x)) < deg(f(x))$ unless $r(x)=0$. This completes the proof
of $(2)$.

When $\chr(K)=0$, similar inductive argument plus Gauss Lemma will
work. We leave it to the readers.
\end{proof}

Finally, if $K= \bQ$ then the cyclotomic extension behave even
nicer.

\begin{prop}
$F=\bQ(\zeta)$ be the $n$-th cyclotomic extension over $\bQ$.
Then\\
\noindent $1$. $g_n(x)$ is irreducible.\\
\noindent $2$. $[F:\ bQ] = \varphi(n)$.\\
\noindent $3$. $\gal_\bQ F \cong \bZ^*_n$.\\
\end{prop}

\begin{ex}
\end{ex}
Consider the $3$-rd cyclotomic extension over $\bF_7$. Then
$g_3(x) = \frac{x^3-1}{x-1} = (x-2)(x-4)$ is not irreducible. \qed

\begin{proof}
Asuuming $(1)$, then $F=\bQ[\zeta]$ is generated by $\zeta$, where
minimal polynomial of $\zeta$ over $\bQ$ is $g_n(x)$. Thus
$[\bQ[\zeta]: \bQ]= deg(g_n(x)) = \varphi(n)$. Morover, for every
$i \in \bZ^*_n$, the map $\zeta \mapsto \zeta^i$ produces an
$\bQ$-automorphism of $F$. Thus $(3)$ follows.

It thus suffices to prove $(1)$. Recall that $g_n(x) \in \bZ[x]$.
If $g_n(x)= f(x) h(x) \in \bZ[x]$, where $f(x)$ is an irreducible
polynomial with $f(\zeta)=0$. We claim that $\zeta^p$ is also a
root of $f(x)$ for all $(p,n)=1$. Grant this claim, then by this
process, we can conclude that $\zeta^i$ is a root of $f(x)$ for
all $(i,n)=1$. Therefore, $f(x)=g_n(x)$ is irreducible.

We now prove the claim. Suppose on the contrary that $\zeta^p$ is
not a root of $f(x)$. Then it's a root of $h(x)$. We have
$h(\zeta^p)=0$. Hence $\zeta$ is a root of $h(x^p)$. Since $f(x)$
is irreducible, it's minimal polynomial of $\zeta$ over $\bQ$. We
have $f(x) | h(x^p)$. Thus we can write $h(x^p)=f(x)k(x)$ for some
$k(x)$ in $\bQ[x]$. By Gauss' Lemma, this equation holds in fact
in $\bZ[x]$. We now consider ring homomorphism $\bar: \bZ[x] \to
\bZ_p[x]$. Then
$$ (\overline{h(x)})^p = \overline{ h(x^p)} = \overline{f(x)}
\overline {k(x)}.$$ Thus $g.c.d(\overline{h(x)},\overline{h(x)})
\ne 1 $ in $\bZ_p[x]$. It follows that $$\overline{x^n-1}
=\overline{ (
\frac{x^n-1}{g_n(x)})}\overline{f(x)}\overline{h(x)}$$ has
multiple roots. But $\overline{x^n-1}'=n\bar{x}^{n-1} \ne 0$. So
this is the required contradiction.
\end{proof}


\vfill \pagebreak
\begin{center}
Dec. 15, 2006
\end{center}

\subsection{solving cubic polynomials}
In this section, we are going to review classical result on
solving polynomials by using non-classical language. I think this
experience also serve a good start for Galois theory in general.

\begin{defn}
A {\bf character} from a group $G$ to a field $K$ is group
homomorphism  $\chi: G \to K^*$. The set of characters is denoted
$Hom_{gp}(G, K ^*)$.
\end{defn}

Let $Hom(G,K)$ be the set of functions from $G$ to $K$. It's clear
that $Hom(G,K)$ is a $K$-vector space.

\begin{thm}[E. Artin]
$Hom_{gp}(G,K^*)$ is linearly independent in $Hom(G,K)$.
\end{thm}


\begin{proof}
Suppose on the contrary that $Hom_{gp}(G,K^*)$ is not linearly
independent. Pick a linearly dependent subset
$\{\chi_1,...,\chi_n\}$ of minimal $n$. There are $a_i \in K$ such
that $\sum a_i \chi_i =0$, i.e. $$\sum a_i \chi_i ( g) =0,
\eqno(*)$$ for all $g \in G$. We can rewrite it as $$\sum a_i
\chi_i (gh)=0, \eqno(**)$$ for all $g,h \in G$. Multiply $(*)$ by
$\chi_1(h)$, we get
$$ \sum a_i \chi_i(g) \chi_1(h)=0. \eqno (***)$$ Compare $(*)$
with $(***)$, we get
$$ \sum a_i ( \chi_i(h)-\chi_1(h)) \chi_i(g) =0 \text{ for all } g \in G.$$
Thus $\sum_{i=2}^n a_i ( \chi_i(h)-\chi_1(h)) \chi_i =0 \in
Hom(G,K)$. It follows that the $n-1$ elements
$\{\chi_2,...,\chi_n\}$ is linearly dependent, which is a
contradiction to the minimality.
\end{proof}

\begin{cor}
Let $F/K$ be an extension. The set of $K$-homomorphisms from $F$
to $\overline{K}$ is linearly independent  in the
$\overline{K}$-vector space of linear maps from $F$ to
$\overline{K}$.
\end{cor}

\begin{proof}[Sketch.]
Take $G= F^*$.
\end{proof}

Let $K$ be a field containing $n$-th root of unity $\zeta$. Let
$F/K$ be a Galois extension with Galois group $\cong \bZ_n$
generated by $\sigma$. We consider
$$ \psi_\zeta: = 1+ \zeta \sigma + \zeta^2 \sigma^2 +...+ \zeta^{n-1}
\sigma^{n-1} \in Hom(F, \overline{K}).$$ Any element of the form
$\psi(x)$ is called a {\bf Lagrange resolvent}.

By direct computation, we have the following properties.

\begin{prop}
Keep the notation as above, we have:\\
\noindent $1.$ $ \sigma( \psi_\zeta(x))= \zeta^{-1}
\psi_\zeta(x)$.\\
\noindent $2.$  $\psi_1(x) \in K$.\\
\noindent $3.$ $(\psi_\zeta(x) )^n \in K.$ \\
\noindent $4.$ $(\psi_\zeta(x) ) (\psi_{\zeta^{-1}}(x) ) \in K$.\\
\noindent $5.$ $\sum_{\zeta \in \mu_n} \zeta^{-r} \psi_\zeta (x) =
n \sigma^r(x)$.
\end{prop}

Now we can use this technique to solve cubic equations. Let $f(x)
= x^3+px+q \in K[x]$ be an irreducible polynomial with
discriminant $D=-4p^3-27q^2 \in K$. We assume that $K$ contains a
primitive $3$-root of unity $\zeta$. We have extension $K \subset
L:=K[\sqrt{D}] \subset F:=K[u_1,u_2,u_3]$. Note that $F/L$ is
Galois with Galois group $\cong \bZ_3$.

\noindent {\bf Step 1.} $\psi_\zeta \ne 0 \in Hom(F,
\overline{K})$, in fact $\psi_\zeta(u_1) \ne 0$.\\

\noindent {\bf Step 2.} $\psi_\zeta(u_1) \ne L$ and
$(\psi_\zeta(u_1))^3 \in L$, thus
$F=L[\psi_\zeta(u_1)]$. \\
And similarly, $\psi_{\zeta^2}(u_1) \in L, (\psi_{\zeta^2}(u_1))^3
\in L$. Moreover, $\psi_\zeta(u_1)\psi_{\zeta^2}(u_1) \in L$.

\noindent {\bf Step 3.} Solve $\psi_\zeta(u_1)$,$\psi_{\zeta^2}(u_1)$ .\\
Recall that $$\Delta:= (u_1-u_2)(u_2-u_3)(u_3-u_1) =
u_1^2u_2+u_2^3u_3+u_3^2u_1-u_1u_2^2-u_2u_3^2-u_3u_1^2.$$
$$ \psi_\zeta(u_1)^3= u_1^3+u_2^3+u_3^3+3 \zeta (u_1^2u_2+u_2^2u_3+u_3^2u_1) +
\zeta^2 (u_1u_2^2+u_2u_3^2+u_3u_1^2) + 6u_1u_2u_3. $$ Let
$v_1=u_1^2u_2+u_2^2u_3+u_3^2u_1, v_2=u_1u_2^2+u_2u_3^2+u_3u_1^2$,
then $$v_1+v_2 = (u_1+u_2+u_3)(u_1u_2+u_2u_3+u_3u_1)-3u_1u_2u_3=
3q, $$
$$ v_1-v_2= \Delta.$$

Thus $ \psi_\zeta(u_1)^3$ can be expressed in terms of $p,q,
\Delta$.

 \noindent {\bf Step 4.} solve $u_1,u_2,u_3$ in terms of
$\psi_\zeta(u_1)$,$\psi_{\zeta^2}(u_1)$.\\
By the property $5$ above, we have
$$ 3u_1=\psi_1(u_1) + \psi_\zeta(u_1)+\psi_{\zeta^2}(u_1),$$
$$ 3u_2 = 3 \sigma(u_1)=\psi_1(u_1) + \zeta^{-1}\psi_\zeta(u_1)+
\zeta^{-2} \psi_{\zeta^2}(u_1),$$
$$3u_3 =3\sigma^2(u_1)= \psi_1(u_1) + \zeta^{-2}\psi_\zeta(u_1)+
\zeta^{-1} \psi_{\zeta^2}(u_1).$$ And note that $\psi_1(u_1)=0$.
So one can solve cubic polynomial explicitly.




\subsection{ cyclic extension}

The discussion in the previous section can be extended to a more
general setting.

\begin{defn}
We say that an  extension is cyclic (resp. abelian) if it's
algebraic Galois  and $\gal_{F/K}$ is cyclic (resp. abelian). An
cyclic extension of order $n$ is an cyclic extension whose Galois
group is isomorphic to $\ZZ_n$.
\end{defn}

The following theorem characterize cyclic extension except some
exceptional case.
\begin{thm} \label{cyclicext_np}
Suppose that $char(K)=0$ or $char(K)=p \nmid n$. Suppose
furthermore that there is a primitive $n$-th root of unity in $K$,
say $\zeta$. Then $F/K$ is a cyclic of order $n$ if and only if
$F=K(u)$ where $u$ is a root of irreducible polynomial $x^n-a \in
K[x]$.
\end{thm}

Before we get into the proof. Let's consider the "difference"
between $u$ and $\sigma(u)$ for  $\sigma \in \gal_{F/K}$. Let
$F/K$ be a finite Galois extension. Then in this circumstance,
norm and trace (which we will define more generally later) are
nothing but $N_{F/K}(u):=\prod_{\sigma \in \gal_{F/K}} \sigma(u)$
and $ T_{F/K}:=\sum_{\sigma \in \gal_{F/K}} \sigma(u)$. It's easy
to see that $T(u-\sigma(u))=0$ and $N(u/\sigma(u))=1$. The follows
lemma says that the converse is also true for cyclic extension,
which will play the central role in the study of cyclic extension.

\begin{lem} \label{hilbert90}
Let $F/K$ be an cyclic extension with $\sigma$ the generator of
the Galois group.
\begin{enumerate}
\item If $T_{F/K}(u)=0$, then there exists an $v \in F$ such that
$u=v-\sigma(v)$.

\item (Hilbert's Theorem 90) If $N_{F/K}(u)=1$, then there exists
an $v \in F$ such that $u=v/\sigma(v)$.
\end{enumerate}
\end{lem}

\begin{proof}[Proof of the Theorem \ref{cyclicext_np}]
Let $u$ be a root of $x^n-a$, then all the roots are $u\zeta^i$
for $i=0,...,n-1$. Since $\zeta \in K$. We can produce an element
in Galois group by considering  $\sigma_i: u \mapsto u \zeta^i$.
Thus we have $\{\sigma_i\}_{i=0,...,n-1} \subset \gal_K F $.  It's
clear that $\gal_K F= \{\sigma_i\}_{i=0,...,n-1} = <\sigma_1>$.
Thus $F=K(u)$ is a cyclic extension over $K$.

Conversely, suppose that  $F/K$ is a cyclic extension of order
$n$. Since there is a primitive $n$-th root $\zeta \in K$, one has
$N(\zeta)=\zeta^n=1$. By the Lemma, there exist an $v$ such that
$\zeta=v/\sigma(v)$. Let $u=v^{-1}$, then $\sigma(u)=\zeta u$.
Hence $\sigma(u^n)=u^n \in K$. Therefore $u$ satisfies $x^n-a \in
K[x]$ for some $a \in K$.

Moreover, for $u \zeta^i$ and $u \zeta^j$, there is an
automorphism sending $u \zeta^i$ to $u \zeta^j$. So they have the
same minimal polynomial $p(x)$ dividing $x^n-a$. One the other
hand, $p(x)$ has $n$ distinct roots $u \zeta^i$ for $i=0,...,n-1$.
It follows that $p(x)=x^n-a$ is irreducible. One has $[K(u):K]=n$
and thus $F=K(u)$.
\end{proof}

\begin{thm}
Suppose that $char(K)=p \ne 0$. Then $F/K$ is a cyclic extension
of order $n$ if and only if $F=K(u)$, where $u$ is a root of an
irreducible polynomial $x^p-x-a \in K[x]$.
\end{thm}

\begin{proof}
The proof is parallel to the previous one.

Let $u$ be a root of $x^p-x-a$, then all the roots are $u+i$ for
$i=0,...,p-1$. It's clear that $F=K(\zeta)$ is a cyclic extension
over $K$ with Galois group generated by $\sigma$ such that
$\sigma(u)=u+1$.

Conversely, suppose that  $F/K$ is a cyclic extension of order
$n$. One has $T(1)=p=0$. By the Lemma, there exist an $v$ such
that $1=v-\sigma(v)$. Let $u=-v$, then $\sigma(u)=u+1$. Hence
$\sigma(u^p)=u^p +1 $ and $\sigma(u^p-u)=u^p-u$. Therefore $u$
satisfies $x^p-x-a \in K[x]$ for some $a \in K$.

Moreover, for $u +i$ and $u +j$, there is an automorphism sending
$u \zeta^i$ to $u \zeta^j$. So they have the same minimal
polynomial $p(x)$ dividing $x^p-x-a$. One the other hand, $p(x)$
has $p$ distinct roots $u +i$ for $i=0,...,p-1$. It follows that
$p(x)=x^p-x-a$ is irreducible. One has $[K(u):K]=n$ and thus
$F=K(u)$.
\end{proof}

It remains to define norm and trace, and prove the main lemma
\ref{hilbert90}.

\begin{defn}
Let $[F:K]$ be a finite separable extension. Let $\Sigma$ be the
set of $K$-embeddings of $F$ into $\overline{K}$. For any $u \in
F$, we define the norm, denoted $$N_{F/K}(u):=(\prod_{\sigma \in
\Sigma} \sigma(u) ).$$ Similarly, we define the trace as
$$ T_{F/K}(u):=(\Sigma_{\sigma \in \Sigma}
\sigma(u) ).$$
\end{defn}

\begin{ex}
If $F/K$ is finite Galois extension, then the set of all
$K$-embeddings of $F$ is nothing but the Galois group of $F$
(since $F$ is normal). Therefore, $N_{F/K}(u)=\prod_{\sigma \in
\gal_{F/K}}\sigma(u)$ and $T_{F/K}(u)=\sum_{\sigma \in
\gal_{F/K}}\sigma(u)$
\end{ex}



\begin{proof}[Proof of Lemma \ref{hilbert90}]
We only prove that $T(u)=0$ implies $u=v-\sigma(v)$. The other
implication is easy.

{\bf Step 1.} Find an element $z\in F$ with $T(z) \ne 0$. This is
an immediate consequence of independency of automorphism.

{\bf Step 2.} We normalize it to get $w \in F$ with $T(w)=1$. In
fact, we take $w:= \frac{z}{T(z)}$.

{\bf Step 3.} Let $$v=
uw+(u+\sigma(u))\sigma(w)+...+(u+\sigma(u)+...+\sigma^{n-2}(u))\sigma^{n-2}(w).$$
Then by direct computation and $T(u)=\sum \sigma(u)=0$,  we are
done.

For the norm, if $N(u)=1$, then $u \ne 0$. Take $$v=uy+u \sigma(u)
\sigma(y)+...+ u \sigma(u)...\sigma^{n-1}(u)\sigma^{n-1}(y).$$ By
independency of automorphism, there exist a $y$ such that $v$ is
non-zero. One checks that $u^{-1}v=\sigma(v)$. We are done.
\end{proof}


\subsection{radical extension}

\begin{defn}
$F/K$ is said to be an radical extension if $F=K(u_1,...,u_n)$
such that for $1 \le i \le n$,  $u_i^{n_i} \in
K(u_1,...,u_{n-1})$.

For a polynomial $f(x) \in K[x]$. We say $f(x)=0$ is solvable by
radical if its splitting field $E$ is contained in some radical
extension.
\end{defn}

\begin{rem}
In the definition, it's not necessary that the splitting field
itself is a radical extension over $K$.
\end{rem}

The main observation is the following:

\begin{prop} \label{rad_w_root}
Let $F/K$ be a radical and Galois extension over $K$. Write
$F=K(u_1,...,u_n)$ such that for $1 \le i \le n$,  $u_i^{n_i} \in
K(u_1,...,u_{n-1})$. Let $m=\prod n_i$ and assume that $char(K)
\nmid m$.  Suppose furthermore that $K$ contains a primitive
$m$-th root of unity. Then $\gal_{F/K}$ is solvable.
\end{prop}

\begin{proof}
Let $K_i:=K(u_1,...,u_i)$. And let $G_i=K_i'$. One sees that $K_1$
is cyclic over $K$, hence Galois over $K$. Hence $G_1 \lhd
G_0=\gal_{F/K}$. Consider next $F/K_1$ which is radical and
Galois. Then $K_2$ is cyclic over $K_1$ and hence similarly, $G_2
\lhd G_1$. Therefore, we have a solvable series $\{e\}=G_n \lhd
G_{n-1} \lhd ... \lhd G_0=\gal_{F/K}$ with $G_{i-1}/G_i$ cyclic.
We are done.
\end{proof}

One can actually generalize it to the following general setting:
\begin{thm}
Let $F/K$ be a radical extension, and $K \subset E \subset F$.
Then $\gal_{E/K}$ is solvable. As a consequence, if $f(x)=0$ is
solvable by radical, then $G_f$ is solvable.
\end{thm}

\begin{proof}
We first reduce to simpler situation.\\
\noindent {\bf Step 1.} Let $G=\gal_{E/K}$ and $K_0=G'$. It's
clear that $F/K_0$ is radical, and $E/K_0$ is Galois for
$\gal_{E/K_0} =G''=G$ and $G'''=G'$. Thus $F/K_0$ is radical and
$E/K_0$ is Galois with Galois group $\gal_{E/K}$.

We thus  replacing $K$ by $K_0$ and assume that $E/K$ is Galois.


\noindent {\bf Step 2.} Reduce to the case that $E=F/K$ is Galois.
To see this, let $\sigma: F \to \overline{K}$ be an $K$-embedding.
One can show that $ \sigma(F)$ is again a radical extension. One
can also prove that if $F_1,F_2 \subset \overline{K}$ are radical
extension over $K$, then $F_1F_2$ is a radical extension over $K$.
Hence let $N$ be the compositum of $\sigma(F)$ for all $\sigma$.
It follows that $N$ is radical over $K$. Moreover, $N$ is normal
over $K$.

Since $E/K$ is Galois, in particular, $E$ is normal over $K$ and
$E$ is a stable intermediate subfield of $N/K$. Then one has a
homomorphism $\gal_{N/K} \to \gal_{E/K}$. This is surjective
because $N$ is normal. Thus it suffices to prove that $\gal_{N/K}$
is solvable.


\noindent {\bf Step 3.} By the same trick an in Step 1. We may
assume that $N/K$ is Galois. Therefore, it suffices  to show that
if $F/K$ is Galois and radical, then $\gal_{F/K}$ is solvable.

\noindent {\bf Step 4.} Since $F/K$ is separable, we may assume
that $(\chr(K),n_i)=1$. Let $m=\prod n_i$.

Let $\zeta$ be a primitive $m$-th root of unity. We claim that
$F(\zeta)$ is Galois over $K$. Grant this for the time being, then
$F(\zeta)$ is Galois over $K(\zeta)$ and $K(\zeta)' \lhd
\gal_{F(\zeta)/K}$. Moreover, $\gal_{F(\zeta)/K}/K(\zeta)' \cong
\gal_{K(\zeta)/K}$. By  Proposition \ref{rad_w_root}, $K(\zeta)'$
is solvable. $K(\zeta)/K$ is cyclotomic, hence $\gal_{K(\zeta)/K}$
is solvable. Thus, $\gal_{F(\zeta)/K}$ is solvable.

Now $F/K$ is Galois, $\gal_{F/K} \cong \gal_{F(\zeta)/K} /F'$
which is solvable.

\noindent {\bf Step 5.} To prove the claim, suppose that $F$ is a
splitting field of separable polynomial $f_1,..,f_n \in K[x]$.
Then $F(\zeta)$ is nothing but a splitting field of separable
polynomials $f_1,...,f_n,x^m-1$. Thus we are done.
\end{proof}

\begin{thm}
Let $E$ be a finite dimensional Galois extension over $K$ with
solvable Galois group. Assume that $char(K) \nmid [E:K]$, then
there is a radical extension $F/K$ containing $E$.
\end{thm}

\begin{proof}
We prover by induction on $[E:K]$. Let $n=[E:K]$ and assume the
theorem is true for all Galois extension of degree $<n$.

Let $\zeta$ be a primitive $n$-th root of unity. Then
$E(\zeta)/K(\zeta)$ is Galois. If $[E(\zeta):K(\zeta)]< n$ then we
are done by induction hypothesis and the fact that $K(\zeta)/K$ is
radical.

By replacing $E,K$ by $E(\zeta),K(\zeta)$ respectively, we my
assume that $K$ has $m$-th root of unity.

$\gal_{E/K}$ is solvable, let $H$ be a subgroup of index $q$, for
some prime $q$. Then $H'/K$ is a cyclic extension, hence a radical
extension. By induction hypothesis, $E/H'$ is radical. We are
done.
\end{proof}

\begin{cor}
Let $f(x) \in K[x]$ be a polynomial of degree $n >0$. Suppose that
$char(K) \nmid n!$, then $f(x)=0$ is solvable by radical if and
only if $G_f$ is solvable.
\end{cor}


\vfill \pagebreak
\begin{center}
Dec. 22, 2006
\end{center}


\subsection{separability and inseparability}

We first recall something about separable extension.


To start with, let $f(x)$ be an irreducible polynomial in $K[x]$
and $f'(x)$ be its derivative (formally). More precisely, if
$f(x)= \sum_{i=0}^n a_i x^i$, then $f'(x):=\sum_{i=1}^{n} i a_i
x^{i-1}$. One has the following equivalence:
\begin{enumerate}
\item $f(x)$ is separable, i.e. no multiple roots in
$\overline{K}$.

\item $(f(x),f'(x))=1 \in \overline{K}[x]$.

\item $(f(x),f'(x))=1 \in K[x]$.

\item $f'(x)=0$.
\end{enumerate}
Therefore, the only possibility to have non-separable polynomial
is $char(K)=p$ and $f(x)=g(x^p)$.

Given an element $u$ algebraic over $K$, one can define the
separable degree to be the number of distinct roots of minimal
polynomial. This notion can be extended to a general setting:

\begin{defn}
Let $F/K$ be an extension. Fix an embedding $\sigma: K \to
L=\overline{L}$. We define the separable degree of $F/K$, denoted
$[F:K]_s$, to be the cardinality of $$S_\sigma:=\{\tau: F \to L|
\tau_{|K}=\sigma \}.$$

In particular, if $F=K(u)$ for some $u$ with minimal polynomial
$p(x)$, then $[F:K]_s$ is the number of distinct roots of $p(x)$
in $\overline{K}$.
\end{defn}

One can check that $[F:K]_s$ is independent of $\sigma$ and $L$.
Hence the definition is well-defined. Moreover, if $F=K(u)$ for
$u$ algebraic over $K$, then $[F:K]_s=[K(u):K]_s$ is the number of
distinct roots of the minimal polynomial $p(x)$ of $u$. This can
be seen by considering $K$-embedding  $\tau :K(u) \to
\overline{K}$, $\tau(u)$ must be a root of $p(x)$ and $\tau$ is
determined by $\tau(u)$.

\begin{prop}
If $K \subset E \subset F$, then $[F:K]_s=[F:E]_s [E:K]_s$.
Moreover, if $F/K$ is finite, then $[F:K]_s \le [F:K]$.
\end{prop}

\begin{proof}[Sketch.]
The first statement follows from the definition.

It's clear that $[K(u):K]_s \le [K(u):K]$ by definition. Then by
induction, we have $[F:K]_s \le [F:K]$ if $[F:K]$ is finite.
\end{proof}

Then we have the following useful criterion:
\begin{prop}
If $F/K$ is finite, then $F/K$ is separable if and only if
$[F:K]_s=[F:K]$.
\end{prop}

\begin{proof}[Sketch.]
Suppose that $F/K$ is separable. Let $L$ be the maximal
intermediate subfield such that $[L:K]_s=[L:K]$. We claim that
$L=F$. Suppose not, let $u \in F -L$. Since $u$ is separable over
$K$, it's separable over $L$. Thus $[L(u):L]_s = [L(u):L]$. So
$[L(u):K]_s= [L(u):K]$ give the contradiction.

Conversely, for any $u \in F$, one sees that $$ [F:K]_s =
[F:K(u)]_s [K(u):K]_s \le  [F:K(u)] [K(u):K] \le [F:K].$$ Since
$[F:K]_s = [F:K]$, we have $[K(u):K]_s = [K(u):K]$. Thus $u$ is
separable over $K$.
\end{proof}

we can then prove the following:
\begin{thm}
Suppose that $F=K(S)$ such that each elements of $S$ is separable
over $K$, then $F/K$ is separable.
\end{thm}



\begin{proof}[Sketch.]
By the previous Proposition, one can see that if $u_1,u_2$ are
separable over $K$, then $K(u_1,u_2)$ is separable over $K$.

In general, if $u \in K(S)$, then $u \in K(u_1,...,u_n)$ for some
$u_1,...,u_n \in S$, hence separable over $K$. Then so is $u$.
\end{proof}


In particular, let $$S:=\{u \in F| u \text{ is separable over }
K\}.$$ Then $S$ is an intermediate subfield  over $K$. The reason
can be seen as following:  $u, v \in S$, $u+v,uv \in K(u,v)$.
Since $u, v$ are separable over $K$. Then $K(u,v)$ is an separable
extension. Thus elements in $K(u,v)$ are separable over $K$.

\begin{exer}
\end{exer}
Separable extension has the following properties:\\
\noindent $1$. Let $K \subset E \subset F$. Then $F/K$ is
separable if and only if $ F/E$ and $E/K$ are separable.\\
\noindent $2$ If $E/K$ is separable then $FE/F$ is separable for
an extension $F/K$.\\
\noindent $3$ If $E,F  \subset L$ are separable extension over
$K$. Then $EF$ is separable over $K$. \qed

\begin{exer}
\end{exer}
Let $F/K$ be a finite extension, then $[F:K]_s = [S:K]$. \qed

%\begin{prop}\label{insep}
%If $F/K$ is a finite extension, then $[F:K]_s \big|[F:K]$.
%Moreover, $[F:K] / [F:K]_s=p^n$ for some $n$.
%\end{prop}

Before we move onto the study of inseparability, we would like to
prove the famous theorem of primitive element.

\begin{thm}\label{prim_elem}
If $F/K$ is separable and finite, then $F=K(\alpha)$ for some
$\alpha \in F$.
\end{thm}

In order to prove the theorem we need to study simple extensions.
When the base field is finite, then things are easy.

\begin{prop}
If $K$ is a finite field and $F/K$ is an algebraic field
extension. The following are equivalent:
\begin{enumerate}
\item $F/K$ is finite.

\item $F=K(\alpha)$ for some $\alpha \in f$. That is, $F/K$ is a
simple extension.

\item There is only finitely many intermediate fields.
\end{enumerate}
\end{prop}

\begin{proof}
For $(1) \Rightarrow (2)$,  if $F/K$ is finite, then $F$ is
finite. $F^*$ is a cyclic multiplicative group, say
$F^*=<\alpha>$. Then it's clear that $F=K(\alpha)$.

$(2) \Rightarrow (1)$ is trivial.

$(1) \Rightarrow (3)$. Suppose that $|K|=q, |F|=q^n$. Let $E$ be
an intermediate field, then it's clear that $|E|=q^d$ for some
$d|n$. One can prove that for any $d|n$, there is exactly one
intermediate field with $q^d$ elements. Hence there are only
finitely many intermediate fields.

$(3) \Rightarrow (1)$. Suppose on the other hand that $F/K$ is not
finite. First consider the case that $F/K$ is not algebraic, i.e.
there is $u \in F$ not algebraic over $K$. Then we have infinitele
many intermediate subfields $K(u) \supset K(u^2) \subset K(u^4)
...$. Which is a contradiction.

Secondly, if $F/K$ is algebraic. Then it is not finitely
generated, otherwise it's finite. We can easily get (by axiom of
choice) a infinite sequence of intermediate fields
$$K \subset K(a_1) \subset K(a_1,a_2)...$$
by adding generators.
\end{proof}

\begin{prop}
Let $F/K$ be a finite extension, then $F=K(\alpha)$ if and only if
there is only finitely many intermediate fields.
\end{prop}

\begin{proof}
If $K$ is finite, then we are done by the previous Proposition. We
assume that $K$ is infinite.

Suppose that there is only finitely many intermediate fields. For
any $\alpha,\beta \in F$, we can consider intermediate fields
$K(\alpha+c\beta)$ as $c$ ranging in $K$. Since $K$ is infinite.
There must exists $c_1, c_2 \in K$ such that
$K(\alpha+c_1\beta)=K(\alpha+c_2 \beta)$. It's easy to check that
$$ K(\alpha,\beta)=K(\alpha+c\beta).$$
By induction on number of generators of $F/K$, we proved that
$F/K$ is a simple extension.

Suppose now that $F=K(\alpha)$. We would like to prove the
finiteness by using the following map:
$$\phi: \{E | K \subset E \subset F\} \to \Sigma:=\{p_E(x)\},$$
where $p_E(x)$ denotes  the minimal polynomial of $\alpha$ over
$E$. Since every $p_E(x)$ is a divisor of $p_K(x)$ in the
algebraic closure (or in the splitting field), it's clear that
$\Sigma$ is finite.

It's enough to prove that $\phi$ is injective. To this end, let
$E_0$ be the extension over $K$ generated by coefficient of
$p_E(x)$. One sees that $p_E(x) \in E_0[x]$ is irreducible and
hence a minimal polynomial of $\alpha$ over $E_0$. Hence we have
$$ [K(\alpha):E]=deg(p_E(x))=[K(\alpha):E_0].$$ It follows that
$E=E_0$. Thus, if $\phi(E)=\phi(E')$, then $E=E_0=E'$. This proved
the injectivity.
\end{proof}


\begin{proof}[Proof of Theorem \ref{prim_elem}]
We may assume that $K$ is infinite.  By induction on generators of
$F/K$, we may assume that $F=K(\alpha,\beta)$. Let $n:=[F:K]_s$,
and $\sigma_1,...,\sigma_n$ be the distinct embedding of $F$ in
$\overline{K}$. Let $$ P(x):=\prod_{i \ne j} (\sigma_i (\alpha+
\beta x )- \sigma_j ( \alpha - \beta x).$$ Since
$deg(P(x))=n(n-1)$ and there are infinitely many elements in $K$,
there must be an $c \in K$ such that $P(c) \ne 0$. Thus all
$\sigma_i( \alpha+c \beta)$ are all distinct. This gives $n$
distinct embedding of $K(\alpha+c \beta)$. One has
$$ [F:K]_s =n \le [K(\alpha+c \beta):K]_s \le [K(\alpha+c \beta):K] \le [F:K].$$
Since $F/K$ is separable, so is $[F:K]_s =[F:K] $. Thus
$[K(\alpha+c \beta):K] \le [F:K]$, and therefore,
$K(\alpha,\beta)=F=K(\alpha+c \beta)$.
\end{proof}

We now turn our interest to non-separable extension. Instead of
non-separable extension in general, we first study the special
case the all roots of minimal polynomial are the same.

\begin{defn}
Let $F/K$ be an extension. An element $u \in F$ is purely
inseparable over $K$ if its minimal polynomial $p(x) \in K[x]$
factors in $F[x]$ as $(x-u)^m$. An extension $F/K$ is purely
inseparable over $K$ if every element of $F$ is purely inseparable
over $K$.
\end{defn}

It's easy to see that an element $u \in F$ which is both separable
and purely inseparable over $K$ if and only if $u \in K$.

Another useful observation is:
\begin{lem}\label{insep}
Let $F/K$ be an extension with $char(K)=0 \ne 0$. If $u \in F$ is
algebraic over $K$, then $u^{p^n}$ is separable over $K$ for some
$n \ge 0$.
\end{lem}
\begin{proof}
The point is that if $u$ is not separable, then its minimal
polynomial $p(x)$ is of the form $f(x^p)$. Then $f(x)$ is the
minimal polynomial of $u^p$. By induction on degree of $u$, we are
done.
\end{proof}

Being purely inseparable has the following equivalent formulation:
\begin{thm}
Let $F/K$ be an algebraic extension with $\chr(K)=p \ne 0$. The
following are equivalent:
\begin{enumerate}
\item $F/K$ is purely inseparable, i.e. every element $u\in F$ has
minimal polynomial of the form $(x-u)^m$.

\item for all $u \in F$, the minimal polynomial is of the form
$x^{p^n}-a \in K[x]$.

\item for all $u \in F$, $u^{p^n} \in K$ for some $n \ge 0$.

\item $S=K$, that is, the only element of $F$ which is separable
over $K$ are the elements in $K$.

\item $F/K$ is generated by purely inseparable elements.
\end{enumerate}
\end{thm}

\begin{proof}
Let $m=p^n r$. $$(x-u)^m=(x-u)^{p^n r}= (x^{p^n}-u^{p^n})^r=x^m-r
u^{p^n} x^{p^n(r-1)}+... \in K[x].$$ Therefore, $u^{p^n} \in K$,
this proved $(1) \Rightarrow (3)$.

Moreover, $p'(x):=x^{p^n}-u^{p^n}) \in K[x]$ and $p'(x)^r$ is the
minimal polynomial of $u$ (hence irreducible). Therefore, $r=1$.
This proved $(1) \Rightarrow (2)$.

$(2) \Rightarrow (3)$ is trivial.

For $(3) \Rightarrow (1)$, let $a=u^{p^n} \in K$, then
$f(x):=x^{p^n}-a \in K[x]$ and factors in $F[x]$ as $(x-u)^{p^n}$.
Hence the minimal polynomial of $u$ over $K$ is a factor of $f(x)$
and factors into $(x-u)^m$ in $F[x]$.

We have seen $(1) \Rightarrow (4)$ and $(5)$, $(4) \Rightarrow
(3)$ follows from the above Lemma \ref{insep}.

It remains to show that $(5) \Rightarrow (3)$. To see this, first
note that $F=K(\Sigma)$ where $\Sigma$ consists of elements $u_i$
such that $u_i^{p^n} \in K$ for some $n$ (By the proof of $(1)
\Rightarrow (3))$. For any $u \in F$, say $u
=\frac{f(u_1,...,u_r)}{g(u_1,...,u_r)}$. Pick $N$ such that $
u_i^{p^N} \in K, \forall i=1,...,r$. Then $u^{p^N} \in K$.
\end{proof}

As a corollary, one can show that $$P:=\{ u \in F| u \text{ is
purely inseparable over } K\}$$ is an intermediate subfield.

\begin{thm}
Let $F/K$ be an algebraic extension. Keep the notation as above
for $S,P$.
\begin{enumerate}
\item $S/K$ is separable.

\item $P/K$ is purely inseparable.

\item $F/S$ is purely inseparable.

\item $F/P$ is separable if and only $F=PS$.

\item $P \cap S =K$.

\item if $F/K$ is normal, then $S/K$ and $F/P$ are Galois. And
$\gal_{F/K}=\gal_{F/P} \cong \gal_{S/K}$.
\end{enumerate}
\end{thm}

\begin{proof}
We have seen $(1),(2),(5)$. $(3)$ follows from Lemm \ref{insep}.
For $(4)$, look at $P \subset SP \subset F$. If $F/P$ is
separable, then $F/SP$ is separable. Look at $S \subset SP \subset
F$ now. We have $F/K$ is purely inseparable, thus so is $F/SP$.
Thus $F=SP$.

On the other hand, if $F=SP=P(S)$, then clearly $F=P(S)$ is
separable over $P$.

Lastly, we look at $G:=\gal_{F/K}$. We claim that $G'=P$, hence
$F/P$ is Galois with Galois group $\gal_{F/P}=\gal_{F/K}$.

To see the claim, if $u \in P$, then it's clear that $\sigma(u)=u$
for all $\sigma \in G$. Therefore, $P \subset G'$. On the other
hand, if $u \in G'$ and $v$ is another root of $p(x)$, the minimal
polynomial of $u$. There is an $\sigma$ such that $\sigma(u) =v$.
Since $F/K$ is normal, this $\sigma$ can be extended to $G$. But
$u\in G'$, thus $v=u$, in other words, $p(x)=(x-u)^m$.

$F$ is Galois over $P$ because $P=G'$. Hence $F/P$ is separable.
By $(5)$, $F=PS$.

 Lastly, we consider $\gal_{F/P}=\gal_{F/K} \to
\gal_{S/K}$ by restriction. This is well-defined since $S$ is
stable. More precisely, for $u \in S$, $\sigma(u) \in S$ for all
$\sigma \in G$ because $\sigma(u)$ has the same minimal polynomial
as $u$ does. This is surjective by extension theorem. It remains
to show the injectivity. If $\sigma|_S=\tau|_S$, then for all $u
\in F$ we have $u^{p^n} \in S$. Thus,
$$\sigma(u)^{p^n}=\sigma(u^{p^n})=\tau(u^{p^n})=\tau(u)^{p^n}.$$
It follows that $\sigma(u)=\tau(u)$.

It remains to show that $S/K$ is Galois. To see this, suppose $u
\in S$ is fixed by all $\sigma \in G$, then $u \in G'=P$. Hence $u
\in K$. We are done.
\end{proof}


\begin{defn}
Let  $F/K$ be a finite extension. We define the inseparable degree
of $F/K$, denoted $[F:K]_i$, to be $[F:K]/[F:K]_s$. \end{defn}

Note that  $[F:K]_i=[F:S]=p^n$ for some $n$.


If $\chr(K)=p \ne 0$, we write $K^p=\{u^p | u \in K\}$.
\begin{defn}
$K$ is said to be perfect if $K^p=K$
\end{defn}

\begin{ex}
Finite fields are perfect. $\bF_p(x)$ is not perfect.
\end{ex}

\begin{cor}
Let $F/K$ be an algebraic extension with $\chr(K)=p \ne 0$. We
have
\begin{enumerate}
\item If $F/K$ is separable, then $F=KF^{p^n}$ for each $n \ge 1$.

\item If $F/K$ is finite and $F=KF^p$, then $F/K$ is separable.

\item In particular, $u \in F$ is separable over $K$ if and only
if $K(u^p)=K(u)$.
\end{enumerate}
\end{cor}


Note that $F^p$ is not necessarily an extension over $K$. So is
$F^{p^n}$. But we can take $KF^{p^n}$, which is an extension over
$K$.

\begin{proof}
We first suppose that $F/K$ is finite, hence finitely generated.
Write $F=K(u_1,...,u_r)$. It's clear that there is $N \ge 1$ such
that $u^{p^N} \in S$. Hence $F^{p^N} \subset S$, therefore,
$KF^{p^N} \subset S$.

We claim that $S=KF^{p^N}$. To see this, one notices that $F$ is
purely inseparable over $KF^{p^N}$, so is $S$ purely inseparable
over $KF^{p^N}$. And on the other hand, $S$ is separable over $K$,
so is over $KF^{p^N}$. Hence $S=KF^{p^N}$.

For (1), if $F/K$ is separable and finite, then we have
$F=KF^{p^N}$. However, in the proof, one can choose $N$ to be
arbitrary large. More precisely, one has $F=KF^{p^N}$ for all $N
\ge N_0$. By looking at the inclusion $$ F=KF^{p^N} \subset
KF^{p^{N-1}} \subset ... \subset KF^p \subset F.$$ One has
$F=KF^{p^n}$ for all $n \ge 1$.

Suppose now that $F/K$ is separable but not necessarily finite.
For any $u \in F$, we consider $F_0:=K(u)$ which is separable and
finite over $K$. Thus $u \in F_0 = K F_0^{p^n} \subset K F^{p^n}$
for all $n \ge 1$. This proves $(1)$.

We now prove $(2)$. If $F=KF^p$, then $F=K(KF^p)^p=KF^{p^2}$.
Inductively, one has $F=KF^{p^n}$ for all $n \ge 1$. Since we have
show that $S=KF^{p^N}$, it follows that $F=S$.

Apply the statement to a single element. We consider $F=K(u)$.
$F^p \subset K^p(u^p) \subset K(u^p)$ . Indeed, $KF^p=K(u^p)$. By
$(2)$, if $K(u)=K(u^p)$, then $u$ is separable. By $(1)$, if $u$
is separable, then $K(u)=K(u^p)$.
\end{proof}



\subsection{transcendental extension} We now start our discussion
on transcendental extension. The main purpose is to show that the
concept of {\it transcendental degree}, which is the cardinality
of transcendental basis,  can be well-defined. Moreover,
transcendental degree is a good candidate for defining dimension.

\begin{defn}
Let $F/K$ be an extension. $S \subset F$ is said to be
algebraically dependent (over $K$) if there is an $n \ge 1$ and an
$f \ne 0 \in K[x_1,...,x_n]$ such that $f(s_1,...,s_n)=0$ for some
$s_1,...,s_n \in S$. Roughly speaking, some element of $S$ satisfy
a non-zero algebraic relation $f$ over $K$.

$S$ is said to be algebraically independent over $K$ if it's not
algebraically dependent over $K$.
\end{defn}

\begin{ex}
For any $u \in F$, $\{u\}$ is algebraically dependent over $K$ if
and only if $u$ is algebraic over $K$.
\end{ex}

\begin{ex}
In the extension $K(x_1,...,x_n)/K$, $S=\{x_1,...,x_n\}$ is
algebraically independent over $K$.
\end{ex}

\vfill \pagebreak
\begin{center}
Dec. 29, 2006
\end{center}

The following theorem says that finitely generated purely
transcendental extension are just rational function fields.

\begin{thm}
If $\{s_1,...,s_n\} \subset F$ is algebraically independent over
$K$. Then $K(s_1,...,s_n) \cong K(x_1,...,x_n)$.
\end{thm}

\begin{proof}
We consider the homomorphism $\theta: K[x_1,...,x_n] \to
K[s_1,...,s_n]$. $\theta$ is surjective by definition. It's
injective because $\{s_1,...,s_n\} \subset F$ is algebraically
independent. Then $\theta$ induces an isomorphism on quotient
fields.
\end{proof}

One notices that the notion of being algebraic independent is an
analogue of being linearly independent. Therefore, one can try to
define the notion of "basis" and "dimension" in a similar way.

\begin{defn}
$S \subset F$ is said to be a transcendental basis of $F/K$ if $S$
is a maximal algebraically independent set. In other words, for
all $u \in F-S$, $S \cup \{u\}$ is algebraically dependent.
\end{defn}

We will then define the {\it transcendental degree} to be the
cardinality of a transcendental basis (in a analogue of
dimension). In order to show that this is well-defined. We need to
work harder.

\begin{prop}
Let $S \subset F$ be an algebraically independent set over $K$ and
$u \in F-K(S)$. Then $S \cup \{u\}$ is algebraically independent
if and only if $u$ is transcendental over $K(S)$.
\end{prop}

\begin{proof}
The proof is straightforward.
\end{proof}

\begin{cor}
$S$ is a transcendental basis of $F/K$ if and only if $F/K(S)$ is
algebraic.
\end{cor}

\begin{proof}
Suppose that $S$ is a transcendental basis of $F/K$. If $u \in
F-K(S)$, then $S \cup \{u \}$ is not algebraically independent.
Thus, $u$ is algebraic over $K(S)$ by the Proposition.

On the other hand, suppose that $F/K(S)$ is algebraic. Then for
all $u \in F-S$, $u$ is algebraic over $K(S)$. By the Proposition,
$S \cup \{u\}$ is algebraically dependent if $u \in F-K(S)$. In
fact, it's easy to see directly that $S \cup \{u\}$ is
algebraically dependent if $u \in K(S)$. Thus $S$ is a maximal
algebraically independent set.
\end{proof}

\begin{cor}
Let $S \subset F$ be an subset over such that $F/K(S)$ is
algebraic. Then $S$ contains  a transcendental basis.
\end{cor}

\begin{proof}
By Zorn's Lemma, there exists a maximal algebraically independent
subset $S' \subset S$. Then $K(S)$ is algebraic over $K(S')$ and
hence $F$ is algebraic over $K(S')$.
\end{proof}

\begin{thm}
Let $S,T$ be  transcendental bases of $F/K$. If $S$ is finite,
then $|T|=|S|$.
\end{thm}

\begin{proof}
Let $S=\{s_1,...,s_n\}$ and $S':=\{s_2,...,s_n\}$. We first claim
that there is an element $t \in T$ , say $t=t_1$ such that
$\{t_1,s_2,...,s_n\}$ is a transcendental basis.

to see this, if every element of $T$ is algebraic over $K(S')$,
then $F$ is algebraic over $K(T)$ hence over $K(S')$ which is a
contradiction. Thus, there is an element $t \in T$ , say $t=t_1$
such that $t_1$ is transcendental over $K(S')$. And hence
$T':=\{t_1,s_2,...,s_n\}$ is algebraically independent.

By the maximality of $S$, one sees that $s_1$ is algebraic over
$K(T')$. It follows that $F$ is algebraic over
$K(t_1,s_1,...,s_n)$ and hence algebraic over $K(T')$. Therefore,
$T'$ is a  transcendental basis.

By induction, one sees that there is a transcendental basis
$\{t_1,...,t_n\} \subset T$. Thus $T=\{t_1,...,t_n\}$.
\end{proof}


\begin{thm}
Let $S,T$ be  transcendental bases of $F/K$. If $S$ is infinite,
then $|T|=|S|$.
\end{thm}

\begin{proof}
By the previous theorem, we may assume that $T$ is infinite as
well.

For $s \in S$, we have $s \in F$ hence algebraic over $K(T)$. Let
$T_s \subset T$ be the subset of $T$ of elements that appearing in
the minimal polynomial of $s$. It's clear that $T_s \ne \emptyset$
otherwise, $s$ is algebraic $K$ which is not the case. Also note
that $T_s$ is finite.

Let $T':=\cup_{s \in S} T_s$. We claim that $T'=T$. To this end,
one sees that for $u \in F$, $u$ is algebraic over $K(S)$ and
hence algebraic over $K(T')$. Thus $F/K(T')$ is algebraic. $T$ is
a transcendental basis, hence $T=T'$.

Lastly, one sees that $$|T|=|T'| = |\cup_{s\in S} T_s| \le |S|
\cdot \aleph_0 = |S|.$$ Replace $S$ by $T$, one has $|S| \le |T|$.
We are done.
\end{proof}

With these two theorem, we can define the transcendental degree of
an extension. And the definition is independent of choices of
basis.

\begin{defn}
Let $F/K$ be an extension and $S$ be a transcendental basis. We
define the transcendental degree of $F/K$, denoted ${\rm tr.d.}
F/K$, to be $|S|$.
\end{defn}

\begin{thm}
Let $F/E$ and $E/K$ be extensions. Then
$$ {\rm tr.d.}F/K={\rm tr.d.} F/E+{\rm tr.d.}E/K.$$
\end{thm}

\begin{proof}
Let $T$ be a transcendental basis of $F/E$ and $S$  be a
transcendental basis of $E/K$. We would like to show that $S \cup
T$ is a transcendental basis of $F/K$. Note that $T \cap E =
\emptyset$, hence $S \cap T =\emptyset$. Thus $|S\cup T|=|S|+|T|$,
and we are done.

To see the claim, it's easy to check that $E(T)=E K( S \cup T)$.
Hence $E(T)/K( S \cup T)$ is algebraic if $E/K(S)$ is algebraic.
Also, $F/E(T)$ is algebraic, therefore, $F/K(S \cup T)$ is
algebraic.

It suffices to show that $S \cup T$ is algebraically independent.
Suppose that there is $f(x_1,...,x_n,y_1,...,y_m)$ such that
$f(s_1,...,s_n,t_1,...,t_m)=0$. We can write
$$f(x_1,...,x_n,y_1,...,y_m)= \sum_{I} h_I(x_1,...,x_n) y^I,$$
and  we have $\sum_{I} h_I(s_1,...,s_n) t^I$. Since $T$ is
algebraically independent over $E \ni h_I(s_1,...,s_n)$. It
follows that $h_I(s_1,...,s_n)=0$ for all $I$. Since $S$ is
algebraically independent over $K$, if follows that
$h_I(x_1,...,x_n)=0 \in K[x_1,...,x_n]$ for all $I$. Therefore
$f(x_1,...,x_n,y_1,...,y_m)=0$. Hence $S \cup T$ is algebraically
independent.
\end{proof}

\begin{ex}
\end{ex}
Let $V : =\{ (a,b)  | a^3=b^2, a,b \in K\}$. Then "polynomial
function on $V$ can be described as $R:=K[x,y]/(y^2-x^3)$. And
rational functions on $V$ is nothing but the field of quotient of
$R$, denoted $F$. Then ${\rm tr.d.}_KF=1$, which is the same as
the "dimension of $V$". \qed

Some related problems:\\
\noindent 1. L\"uroth's theorem and rationality problem.\\
The L\"uroth's theorem states that a non-trivial subfield of
$k(x)$ is of the form $k(t)$, where $t \in K(x)$. More generally,
one can ask a subfield $E \subset K(x,y)$ of  $\rm{tr.d}_K=2$ is
purely transcendental or not. One can prove that this is true when
$K = \bC$ by geometric method. However, this is not true in
general when transcendental degree is higher.

Nevertheless, suppose that there is a finite group $G$ acts on
$k(x_1,...,x_n)$. One can ask whether the subfield of invariant
purely transcendental or not. Or under what condition, the field
of invariant is purely transcendental. A variety (as $V$ above) is
called {\bf rational} if its rational function field is purely
transcendental. So this is called {\bf rationality problem}.

\noindent 2. Automorphism of function fields.\\
Consider $F=K(x)$. It's well-known that $\Aut_K(F) = PGL(2,K)$.
How about $K$-automorphism $F=K(x_1,...,x_n)$?

\noindent 3. Characterize birational invariants.\\
Varieties as said to be birational if their function fields are
isomorphic. Therefore, those birational invariant, which reflect
the birational geometry of varieties, are invariant of fields. Can
you read it from the fields?

\vfill \pagebreak

\section{Homological Algebra}

Some useful references:\\
 \noindent Serge Lang,{\it  Algebra}, GTM 211, Springer \\
S. Gelfand, Y. Manin, {\it Methods of homological algebra}, Springer\\
David Eisenbud, {\it Commutative algebra}, GTM 150, Springer\\

\subsection{categories and functors}
In this section, we are going to define some basic notions.

\begin{defn}
A {\bf category} is a class $\mc C$ of objects, denoted
$A,B,C,...,$ etc., together with
\begin{enumerate}
\item  a class of disjoint set, denoted $\Hom_{\mc C}(A,B)$,
called {\bf morphism} and
 \item  for each triple $(A,B,C)$ of
objects a function $Hom(B,C) \times \Hom(A,B) \to \Hom(A,C)$,
called the {\bf composition} subjects to
\begin{enumerate}
\item $h \circ (g \circ f) = (h \circ g ) \circ f$.
 \item for each object $A \in \mc C$, there exists $\id_A \in \Hom(A,A)$ such that $ \id_A
\circ f = f, f \circ \id_A = f$.
\end{enumerate}
\end{enumerate}
\end{defn}

\begin{ex}
\end{ex}
\begin{enumerate}
\item The category of Sets, denoted $ {\it Set}$.

\item The category of groups, denoted $ {\it Gp}$, is a
subcategory of ${\it Set}$.

\item The category of abelian groups, denoted ${\it Ab}$, is a
subcategory of ${\it Gp}$.
\end{enumerate}

\begin{defn} Let $\mc C, \mc D$ be  categories. A {\it covariant
functor} (resp. {\it contravariant functor}) $F$ of $\mc C$ to
$\mc D$ is a rule which to each object $A \in \mc C$ associate an
object $F(A) \in \mc D$, and to each morphism $f: A \to B$
associate a morphism $F(f): F(A) \to F(B)$ (resp. $F(f): F(B) \to
F(A)$) such that:
\begin{enumerate}
\item $F(\id_A)= \id_{F(A)}$. \item $F(g\circ f) = F(g) \circ
F(f)$ (resp. $F(g\circ f) = F(f) \circ F(g)$).
\end{enumerate}

\end{defn}

There are many cases we met the {\it universal property}. This can
be seen via the universal object in a suitable category.

\begin{defn}
In a category $\mc C$, an object $P$ is said to be universally
attracting (resp. repelling) if $\Hom(A,P)$ (resp. $\Hom(P,A)$)
has only one element for all $A \in \mc C$.
\end{defn}

\begin{ex}\end{ex} The group of one element is the universally
repelling and attracting object in $Gp$.

\begin{ex}\end{ex} Fixed a set $S$. Let $\mc C$ be the category of maps
form $S$ to abelian groups. The free abelian group is the
universally repelling object.

Similarly, if we consider the category of maps from $S$ to groups.
Then we get free group by considering the universal repelling
object. \qed

\begin{ex}\end{ex} In a category $\mc C$, the product of $A,B$ can
be defined as $(P,f,g)$ consisting of an object $P$ and $f: P \to
A$, $g: P \to B$ such that for any $(C,s,t)$, there exist a unique
$h: C \to P$, which makes the diagram commute.

In other words, let $\mc D $ be the category of the triple
$(C,s,t)$, then $P$ is nothing but the universal attracting
object. \qed

We now formulate the axioms of {\bf additive category} and {\bf
abelian category}.

{\bf A1.} $\Hom(A,B)$ is an abelian group. And composition is
bilinear.

{\bf A2.} There exist a zero object $0$, i.e. such that
$\Hom(0,A), \Hom(A,0)$ has precisely one element.

{\bf A3.} Finite direct sum and finite direct product exist. In
other words, for $A_1,A_2 \in \mc C$, there exist an object $C \in
\mc C$ and $p_i: C \to A_i$, $\imath_i:A_i \to C$ such that $p_i
\imath_i = \id_{A_i}$, $p_i \imath_j =0$ if $i \ne j$, $\imath_1
p_1 + \imath_2 p_2 = \id_{C}$.

{\bf A4.} For any morphism $f: A \to B$, there exist a sequence,
called a {\it canonical decomposition}
$$ K \stackrel{k}{\to} A \stackrel{\imath}{\to} I
\stackrel{\jmath}{\to} B \stackrel{c}{\to} K'$$ such that
\begin{enumerate}
\item $\jmath \circ \imath = f$ \item $K$ is the kernel of $f$ and
$K'$ is the cokernel of $f$. \item $I$ is cokernel of $k$ and
kernel of $c$.
\end{enumerate}

In the above canonical decomposition, $K$ can be viewed as kernel,
$I$ as the image and $K'$ as the cokernel.

\begin{defn}
A category satisfying $A1,A2,A3$ is called an additive category.
An additive category satisfying $A4$ is called an abelian
category.
\end{defn}

\begin{rem}
The kernel and cokernel should be defined abstractly. For example,
given $A \in \mc C$, one can define a functor $h_A: \mc C ^\circ
\to Set$ such that $h_A(C) = \Hom(C,A)$. A functor $F$ is {\bf
representable} by $B$ is $F \cong h_B$.

In an additive categoty $\mc C$, for a morphism $f: A \to B$, one
can define a kernel functor   $Ker(f):\mc C^\circ \to Ab$ such
that $Ker(f) (C) = Ker( h_A(C) \to h_B(C))$.

We say  that kernel of $f$ exists if the functor $Ker(f)$ is
representable.

Cokernel can be defined similarly but a little bit subtle. It's
$ker( f^\circ)^\circ$.
\end{rem}

\begin{ex}
\end{ex}
The followings are abelian categories:
\begin{enumerate}
\item ${\it Ab}$. \item category of $R$-modules, where $R$ is a
ring. \item category of finite dimensional vector space over $k$.
\item category of sheaves of abelian groups over a topological
space.
\end{enumerate}
\qed


\subsection{complexes, examples of homology and cohomology groups}
There are various situation where we need to consider a sequence
of abelian group. This is basically why homological algebra arise.

\begin{defn}
Let $\mc A$ be an abelian category. A comlpex
$K^\bullet=(K^i,d_i)_{i \in \mb Z}$ consists of $K^i \in \mc A$,
$d^i: K^i \to K^{i+1}$ such that $d^{i+1}d^i=0$ for all $i$.

A complex is said to be exact if $\ker(d^{i+1}) = \im(d^{i})$.
\end{defn}


\begin{ex} [Homology of simplicial complex] \end{ex}
Given a simplicial complex $X$, we can view it as $\cup X_n$,
where $X_n$ denotes the $n$-skeleton. To each $n$, we attach a
free abelian $C_n$ on $n$-simlpex. Note that there is a natural
{\it boundary map} $\partial_n$ from a $n$-complex to $(n-1)-$
complex. Note that one need to handle signs by considering the
orientation. It follows that $\partial \circ \partial =0$. Hence
we have a complex of free abelian groups $ (C_n,
\partial)$.

The homology can be considered as the obstruction of this complex
being exactness. That is, $H_i(X,\mb Z):= \ker (\partial_n)/
\im(\partial_{n-1})$.

For example, the homology of $S^2$ can be realized by
$$ 0 \to \mb Z [f]  \to \mb Z [e_1] \oplus \mb Z [e_2] \to \mb
Z[x_1] \oplus \mb Z [x_2] \oplus \mb Z[x_3] \to 0.$$ And $\partial
[f] = [e_1]+[e_2] -[e_2] -[e_1], \partial [e_1] = [x_2]-[x_1],
\partial[e_2] = [x_3]-[x_2], \partial[x_i]=0$.
Therefore, $H_2(S^2) \cong \mb Z$, $H_1 \cong 0$, $H_0 \cong \mb
Z$. \qed

\begin{exer} compute the homology of  $ S^n, \mb {RP}^2, T^2$ and Klein bottle.
\end{exer}


\begin{ex}\end{ex} [differential forms, De Rham complex and cohomology]
Let $X$ be a differentiable manifold, e.g $\mb R^n$. Let $C^i$ be
the vector space of $\mc C^\infty $ $i$-forms on $X$. There is the
natural differential $d: C^i \to C^{i+1}$. Then we have a complex
$(C^i, d)$, called the de Rham complex. Similarly, we have de Rham
cohomology $H^i:= \ker(d^i)/ \im (d^{i-1})$. \qed

\begin{ex} [Koszul complex, free resolution] \end{ex}
Given a ring $R= k[x,y,z,w]/(xz-y^2,xw-yz,yw-z^2).$ How can we
realize it via describing generators and relations?

Let $S= k[x,y,x]$, then there is an exact sequence
$$ 0 \to \oplus S^2 \to  \oplus^3 S \stackrel{(xz-y^2,xw-yz,yw-z^2)}{\longrightarrow} S \to R
\to 0.$$ So the ring $R$ can be realized as the complex of free
modules. This is an example of so-called {\it free-resolution}.
\qed

What we would like to do is more or less the algebraic structure
needed for this kind of situation.

\vfill \pagebreak
\begin{center}
Jan. 5, 2007
\end{center}
\subsection{complexes, exact sequences}
.


\begin{defn}
By a short exact sequence, we mean an exact sequence $0 \to A \to
B \to C \to 0$.
\end{defn}

\begin{ex}\end{ex}
\noindent $1.$ Let $A,B$ be abelian groups, then we have exact
sequence:
$$ 0 \to A \stackrel{\imath_A}{\to} A \oplus B \stackrel{p_B} \to B \to 0.$$

\noindent $2.$ Let $A \lhd B$ be abelain groups, then we have
exact sequence:
$$ 0 \to A \to B \to B/A \to 0.$$

\noindent $3.$ Let $\varphi: B \to C $ be a surjective
homomorphism, then we have exact sequence:
$$ 0 \to \ker(\varphi) \to B \to C \to 0.$$
\qed

Given a  long exact sequence $K^\bullet=(K^i,d_i)$, it  can be
decomposed into short exact sequences $$0 \to \ker(d^i)=
\im(d^{i-1}) \to K^i \to \im(d^i)= \ker(d^{i+1}) \to 0.$$

Therefore, short exact sequences play the most important role in
our studies.

Given a morphism $\phi \in \Hom(K^\bullet,L^\bullet)$ of
complexes, one can define its  kernel, image, cokernel, in a
natural way. Thus we can formulate a new category $Kom(\mc A)$,
whose objects are complexes over $\mc A$ and morphisms are
morphism of complexes.

\begin{exer}
 $Kom(\mc A)$ is an abelian category in which $\mc A$ is a subcategory.
\end{exer}

Let $K^\bullet$ be a complex. We let $Z^i := \ker(d^i)$, called
the $i$-{\bf th cocycle} and $B^i:= \im (d^{i-1})$, called the
$i$-{\bf th coboundary}. Then $H^i(K^\bullet):= Z^i/B^i$ is called
the $i$-{\bf th cohomology} of $K^\bullet$. Cohomology can be
viewed as a tool detecting the non-exactness of complexes.

Given two complexes $K^\bullet, L^\bullet$, a  morphism of
complexes $\phi \in Hom_{\mc A} (K^\bullet, L^\bullet)$ consists
of morphisms $ \phi^i: K^i \to L^i$ such that $ \phi^{i+1} \circ
d^i_K = d^i_L \circ \phi^{i}$ for all $i$. Another way to put it
is the following diagram commute:

$$\begin{CD}
 @>>> K^i @>{d_K^i}>> K^{i+1} @>>> @. \\
@. @V{\phi^i}VV @V{\phi^{i+1}}VV @. \\
@>>> L^i @>{d_L^i}>> L^{i+1} @>>> @.
\end{CD}
$$

One can easily checked that there is an induced map $H^i(\phi):
H^i(K^\bullet) \to H^i(L^\bullet)$ for all $i$. Moreover, if
$\phi, \psi$ are morphism of complexes, then $H^i(\psi) \circ
H^i(\phi) = H^i (\psi \circ \phi)$ for all $i$ whenever it make
sense.

Before we move on, we discuss the following useful lemmas:

\begin{lem}[Snake Lemma] Given a diagram
$$ \begin{CD}
@. A' @>{f}>> A @>>> A'' @>>> 0 \\
@. @V{d'}VV @V{d}VV @V{d''}VV @. \\
0 @>>> B' @>>> B @>{g}>> B'' @.
\end{CD}
$$ with each rows are exact.  Then there is a well-defined map $\delta: \ker(d'') \to \coker(d')$
such that we have an exact sequence
$$ \ker(d') \stackrel{f}{\to} \ker(d) \to \ker(d'') \stackrel{\delta}{\to}
\coker(d') \to \coker(d) \stackrel{\bar{g}}{\to} \coker(d'').$$

If moreover that $f: A' \to A$ is injective, then $f: \ker(d') \to
\ker(d)$ is injective. And if $g: B \to B''$ is surjective, then
$\bar{g}:\coker(d){\to} \coker(d'')$ is surjective.
\end{lem}

\begin{proof} The proof consists of various diagram chasing. We
leave it to the reader.
\end{proof}

\begin{cor}
Keep the notation as above. If both $d',d''$ are injective (resp.
surjective) then so is $d$.

Assume that $f$ is injective and $g$ is surjective. If any two of
$d',d,d''$ are isomorphism. So is the third one.
\end{cor}

\begin{lem}[Five Lemma] Given a diagram
$$ \begin{CD}
A_1 @>>> A_2 @>>> A_3 @>>> A_4 @>>> A_5 \\
@V{d_1}VV @V{d_2}VV @V{d_3}VV @V{d_4}VV @V{d_5}VV \\
B_1 @>>> B_2 @>>> B_3 @>>> B_4 @>>> b_5
\end{CD}
$$ with each rows are exact.

If $d_1$ is surjective (resp. injective) and $d_2,d_4$ are
injective (resp. surjective), then $d_3$ is injective (resp.
surjective).

In particular, if $d_1,d_2,d_4,d_5$ are isomorphic, then so is
$d_3$.
\end{lem}

\begin{proof}
Decompose the sequence into short exact sequences.
\end{proof}

An immediate application is the following:
\begin{prop}
Given an exact sequence $0 \to A \stackrel{f}{\to} B
\stackrel{g}{\to} C \to 0$, the following are equivalent:
\begin{enumerate}
\item there is $h: C \to B$ such that $gh= \id_C$.

\item there is $l: B \to A$ such that $l f = \id_A$.

\item the sequence is isomorphic to $ 0 \to A
\stackrel{\imath_A}{\to} A \oplus C \stackrel{p_C}{\to} C \to 0$.
\end{enumerate}
Such sequence is called {\bf split}.

If the sequence split, then in particular, $B \cong A \oplus C$.
\end{prop}

\begin{proof}
Given $h: C \to B$, we can construct the following commutative
diagram:
$$ \begin{CD}
0 @>>> A @>{\imath_A}>> A \oplus C @>{p_C}>> C @>>> 0 \\
@VVV @V{\id_A}VV @V{f p_A+h p_C}VV @V{\id_C}VV @VVV \\
0 @>>> A @>{f}>> B @>{g}>> C @>>> 0 \\
\end{CD}
$$
By Five Lemma, $f p_A+h p_C $ is an isomorphism. Hence those two
sequences are isomorphic.

On the other hand, if the two sequence are isomorphic. That is we
have the following commutative diagram, which is invertible:
$$ \begin{CD}
0 @>>> A @>{\imath_A}>> A \oplus C @>{p_C}>> C @>>> 0 \\
@. @V{\id_A}VV @V{\phi}VV @V{\id_C}VV @.\\
0 @>>> A @>{f}>> B @>{g}>> C @>>> 0 \\
\end{CD}
$$

 Let $h= \phi
\circ \imath_C: C \to B$, then $gh=g \phi \imath_C =\id_C p_C
\imath_C =\id_C $.

The proof for other equivalence is similar.
\end{proof}


\begin{thm}
Given a short exact of complexes, then it induces a long exact
sequences of cohomology.
\end{thm}

\begin{proof}
This can be proved directly, or by Snake Lemma.

We briefly sketch the proof by using Snake Lemma here.

First look at the diagram
$$ \begin{CD}
0 @>>> A^{i-1} @>>> B^{i-1} @>>> C^{i-1} @>>> 0 \\
@. @VVV @VVV @VVV @. \\
0 @>>> A^{i} @>>> B^{i} @>>> C^{i} @>>> 0 \\
\end{CD}
$$

Then we have exact sequence $ A^i/B^i(A^\bullet) \to
B^i/B^i(B^\bullet) \to C^i/B^i(C^\bullet) \to 0$ by looking at
cokernel of the maps.

Next we look at the diagram
$$ \begin{CD}
0 @>>> A^{i+1} @>>> B^{i+1} @>>> C^{i+1} @>>> 0 \\
@. @VVV @VVV @VVV @. \\
0 @>>> A^{i+2} @>>> B^{i+2} @>>> C^{i+2} @>>> 0 \\
\end{CD}
$$

Then we have exact sequence $ 0 \to Z^{i+1}(A^\bullet) \to
Z^{i+1}(B^\bullet) \to Z^{i+1}(C^\bullet)$ by looking at kernels.

These two exact sequences fit into a commutative diagram
$$ \begin{CD}
 @.  A^i/B^i(A^\bullet) @>>>
B^i/B^i(B^\bullet) @>>> C^i/B^i(C^\bullet) @>>> 0 \\
@. @V{\bar{d}_A^i}VV @VVV @VVV@. \\
0 @>>> Z^{i+1}(A^\bullet) @>>> Z^{i+1}(B^\bullet) @>>>
Z^{i+1}(C^\bullet) @.
\end{CD}
$$

One can check that $\ker ({\bar{d}_A^i} ) = H^i(A^\bullet)$ and
$\coker ({\bar{d}_A^i} ) = H^{i+1} (A^\bullet)$. And similarly for
$B^\bullet$ and $C^\bullet$. Hence by Snake Lemma, we are done.
\end{proof}

\begin{defn}
Let $F: \mc A \to \mc B$ be a functor between two abelian
categories. We say that $F$ is {\bf exact} if for an exact
sequence $K^\bullet$ over over $\mc A$, $F(K^\bullet)$ is exact
over $\mc B$.
\end{defn}

\begin{exer}
Show that $F$ is exact if and only if for any short exact sequence
$ 0\to A \to B \to C \to 0$ in $\mc A$, the induced sequence $0
\to F(A) \to F(B) \to F(C) \to 0$ is exact in $\mc B$.
\end{exer}

\begin{defn}
Keep the notation as above. We say that $F$ is left-exact (resp.
right-exact) if for any short exact sequence $ 0\to A \to B \to C
\to 0$ in $\mc A$, the induced sequence $0 \to F(A) \to F(B) \to
F(C)$ (resp. $F(A) \to F(B) \to F(C) \to 0$) is exact in $\mc B$.
\end{defn}

Unfortunately, most natural functors are left-exact (or
right-exact) but not exact. We list some of them:

\begin{ex} \end{ex} Let $X$ be a topological space. Let $Sh_X$ be
the category of sheaves on $X$, which is an abelian category. The
global section functor $\Gamma(X, \cdot) : Sh_X \to Ab$ is left
exact but not exact. \qed

\begin{ex} \end{ex} Let $Ab$ be the category of abelian groups.
Fixed $M \in Ab$, we consider $ \Hom(M. \cdot) : Ab \to Ab$ by $ A
\mapsto \Hom(M,A)$. This is left-exact but not right exact. \qed

It is natural to ask what the defect of these functors. Which will
be realized in the next section


\vfill \pagebreak
\begin{center}
Jan. 12, 2007
\end{center}
\subsection{injective}
In this section, we are going to define injective objects. Then
one has injective resolution if the category has enough
injectives. Moreover, we will see that injective resolution are
convenient for handling left exact but not exact functors.

\begin{defn}
Let $\mc A$ be an abelian category.
 An object $I \in \mc A$ is injective if
 for all $0 \to A \to B$ and $A \to I$, there exists $B \to I$
makes the diagram commute.
\end{defn}

\begin{prop}
$I$ is injective if and only if the functor $M \mapsto Hom_{\mc
A}(M,I)$ is exact.
\end{prop}


\begin{proof}
For every exact sequence $0 \to A \to B \to C \to 0$, we have
exact sequence
$$\Hom(A,I) \leftarrow \Hom(B,I) \leftarrow \Hom(C,I)\leftarrow
0.$$ The definition of injective says nothing more than that
$\Hom(B,I) \to \Hom(A,I)$ is surjective.
\end{proof}

\begin{exer} If $I$ is injective, then every sequence $ 0 \to I \to B \to C \to 0$ splits.
\end{exer}

An abelian category $\mc A$ is said to have {\bf enough
injectives} if for every $A \in \mc A$, there exist an injective
object $I \in \mc A$ and an injection $0 \to A \to I$.

Suppose now that $\mc A$ has enough injectives. Then for every $A
\in A$, one has $0 \to A \stackrel{\imath}{\to} I^0$ for some
injective $I^0$. Next look at $\coker(\imath)$, one has $ 0\to
\coker(\imath) \to I^1$ for some injective $I^1$ and let $d^0: I^0
\to I^1$ be the composition map. Inductively, we obtained a
sequence $$ 0 \to A \to I^0 \to I^1 ...$$ It's easy to see that
it's an exact sequence because it patches short exact sequences $
0\to \coker(\imath_{j-1}) \stackrel{\imath_j}{\to} I^j  \to
\coker(\imath_{j}) \to 0$.

Before we move on, it worthwhile to think what indeed injective
object is and why we expect an abelian category has enough
injectives.

Let $Ab$ be the abelian category of abelian groups. A group $G$ is
said to be {\bf divisible} if $m : G \to G$ by $m: x \mapsto mx$
is surjective for all $m \ne 0 \in \mb Z$. In other words, for
$x\in G$, and for all $m \ne 0 \in \mb Z$, there is $y \in G$ such
that $ny=x$. We will show that in $Ab$:
\begin{lem} \label{div2inj} $G$ is divisible, then $G$ is injective.
\end{lem}
\begin{lem} \label{emb2div} Every abelian group can be embedded into a
divisible group.
\end{lem}
 Thus the abelian category $Ab$ has
enough injective. It also follows that those natural abelian
categories, such as category of $R$-modules, category of sheaves
of abelian groups, has enough injective.

In order to prove the Lemmata, we observe that:
\begin{enumerate}
\item if $G$ is divisible, so if $G/N$ for any normal subgroup
$N$.

\item if $G_i$ are divisible for all $i$, then $\sum_{i \in I}
G_i$ is divisible.
\end{enumerate}

\begin{proof}[proof of \ref{div2inj}]
Suppose that $G$ is divisible and $ 0\to A' \to A$ is exact with a
map $f': A' \to G$. We need to show that there is $f: A \to G$
extending $f'$.

We shall use Zorn's Lemma. Let $\Sigma = \{ (B,g)| A' < B < A, g:B
\to G, g|_{A'}=f' \}$. There exists a maximal element $(M,h)$ in
$\Sigma$. One verifies that $M=A$.
\end{proof}

\begin{proof}[proof of \ref{emb2div}]
$ G \cong F/K$, $F \cong \sum_{x \in I} \mb Z x$. $F
\stackrel{f}{\hookrightarrow} \sum_{x \in I} \mb Q x$. $G \cong
F/K \cong f(F)/f(K) <\sum_{x \in I} \mb Q x / f(K)$ is divisible.
\end{proof}


\begin{lem}
Let $I^\bullet$ be an injective resolution of $A$ and $J^\bullet $
an injective resolution of $B$. If there is $\varphi: A \to B$, then
there exists $f: I^\bullet \to J^\bullet$ compatible with $\varphi$.

Moreover any two such $f,g : I^\bullet \to J^\bullet $ are
homotopic.
\end{lem}

\begin{defn}
$f ,g \in  \Hom(\cx K, \cx L)$ are homotopic if there are $h^i:
K^i \to L^{i-1}$ such that $ d_Lh+hd_K= f-g$.
\end{defn}

Injective resolution is very useful in the study of left exact
functors which is not exact. More, precise the following Lemma show
that injective rsln splits

\begin{lem}
Given $ 0 \to A \to B \to C \to 0$, there is an exact sequence of
complexes $0 \to I^\bullet \to J^\bullet \to K^\bullet \to 0$ such
that $\cx I$ (resp, $\cx J, \cx K$) is an injective resolution of
$A$ (resp. $B,C$). Moreover, $J^i = I^i \oplus K^i$.
\end{lem}

\begin{proof}
We define $I^0, K^0$ first. Then there is a natural map $B \to
J^0:=I^0 \oplus K^0$. This map is injective.

Then inductively, we get the resolutions.
\end{proof}
Warning: $J$ is not $I \oplus K$ as complex. For example, the map
$I^0 \oplus K^0 \to I^1 \oplus K^1$ is of the form $(d_I(i^0)+*,
d_K(k^0))$ where  $*$ is not necessarily zero.

We are now ready to study the left-exact functors. Apply $F$ to
$$
\begin{CD}
0  @>>> A @>>> B @>>> C @>>> 0 \\
@. @VVV @VVV @VVV @. \\
0 @>>> I^\bullet @>>> \cx J @>>> \cx K @>>> 0
\end{CD}
$$
We get
$$
\begin{CD}
0  @>>> F(A) @>>> F(B) @>>> F(C) @. @. \\
@. @VVV @VVV @VVV @. \\
0 @>>> F(I^\bullet) @>>> F(\cx J) @>>> F(\cx K) @>>> 0
\end{CD}
$$
Notice that the bottom row is exact because $J^i = I^i \oplus K^i$
by our construction, hence $F(J^i)= F(I^i) \oplus F(K^i)$ for all
$i$.

\begin{prop}
Let $R^iF(A) := H^i( F( \cx I))$. Then we have: \\
\begin{enumerate}
\item $R^0F(A) =A$.

\item there is a long exact sequence $$ 0 \to F(A) \to F(B) \to
F(C) \to R^1F(A) \to R^1F(B) \to ...$$
\end{enumerate}
\end{prop}

\begin{proof}
It's easy to see that $\ker ( F(I^0) \to F(I^1)) \cong F(A)$ by
the left exactness. And the second statement follows from the long
exact sequence of cohomology of short exact sequence of complexes.
\end{proof}

\begin{exer}
Show that $R^iF(A)$ is well-defined. That is, independent of
choice of injective resolution.
\end{exer}
\subsection{derived category}
In this section, we are going to describe derived category
briefly. It's a category over which cohomology theory can be
defined and convenient to operate.
\begin{exer}
If $h$ is homotopic to $0$, denoted  $h \sim 0$, then $f h \sim
0$, $h g \sim 0$ for all $f ,g$ whenever it makes sense.
\end{exer}

So we can think of the class of homotopic equivalence as an ideal.

Let $\mc K(\mc A)$ be the category whose objects are complex in
$\mc A$ and morphisms are morphism in $\mc A$ quotient homotopic
equivalence. More precisely, $\Hom_{\mc K(\mc A)}( \cx K, \cx L)$
consists of homotopic equivalent class of $\Hom_{Kom (\mc A)} (
\cx K, \cx L)$.

Then in $\mc K ( \mc A)$, injective resolution is unique (up to
isomorphism).

\begin{defn}
Given a complex $\cx K = (K^i, d_K^i)$, we define $ \cx {K[n]}$
such that $K[n]^i=K^{n+1}, d_{K[n]}^i = (-1)^n d_K^{n+i}$.

And given a morphism $f:\cx K \to \cx L$, we define a complex $\cx
{C(f)}$, called the {\bf mapping cone of $f$}, by $C(f)^i =
K^{i+1} \oplus L^i$ and $d_C^i ( k^{i+1}, l^i) = ( -
d_K^{i+1}(k^{i+1} ), f(k^{i+1})+d_L^i(l^i))$.
\end{defn}

\begin{ex}\end{ex} If $\cx K = K, \cx L =L$, then $C(f) = 0 \to K
\to L \to 0$. \qed

\begin{ex} \end{ex} If $f =0$, then $C(f)= \cx K \oplus \cx L$.

\begin{defn}
Given a morphsim $ f: \cx K \to \cx L$, we define a complex $\cx {
Cyl(f)} $ such that $Cyl(f)^i = K^i \oplus K^{i+1} \oplus L^i$.
And $d_{Cyl}^i (k^i, k^{i+1},l^i)= (d_K k^i- k^{i+1}, - d_K
k^{i+1}, f(k^{i+1})+d_L l^i)$.
\end{defn}

\begin{thm}
We have the following diagram
$$
\begin{CD}
@. 0 @>>> \cx L @>>> \cx{C(f)} @>{\delta}>> \cx {K[1]} @>>> 0 \\
@. @. @V{\alpha}VV @VVV @. @. \\
0 @>>>  \cx K @>{\bar{f}}>> \cx {Cyl(f) } @>{\pi}>> \cx{C(f)} @>>> 0 @. \\
@. @V{=}VV @V{\beta}VV @. @. @. \\
@. \cx K @>{f}>> \cx L @. @. @.
\end{CD}
$$
Such that each row is exact. $\alpha, \beta$ are
quasi-isomorphisms. Moreover, $\beta \alpha = \id_{ L}$ and
$\alpha \beta \sim \id_{Cyl(f)}$.
\end{thm}

\begin{proof} All the above maps are the natural ones. One has to check that all the
maps indeed gives morphism of complexes and the diagram commutes.
We leave the detail to the readers.

 The homotopy is defined by
$h^i(k^i,k^{i+1},l^i)=(0,k^i,0)$.
\end{proof}

\begin{thm} Given an exact sequence $0 \to \cx K \to \cx L \to \cx M \to 0$, we have the following commutative diagram with
each vertical map being quasi-isomorphic.
$$ \begin{CD}
0 @>>> \cx K @>f>> \cx L @>g>> \cx M @>>> 0 \\
@. @AAA @A{\beta}AA @A{\gamma}AA @. \\
0 @>>>  \cx K @>{\bar{f}}>> \cx {Cyl(f) } @>{\pi}>> \cx{C(f)} @>>> 0 @. \\
\end{CD} ,$$
where $\gamma(k^{i+1},l^i)=g(l^i)$.

The second row is called {\bf distinguished triangle}.

\end{thm}

Derived category $D(\mc A)$ is the category localizing $\mc K (\mc
A)$ with respect to quasi-isomorphisms. That is, a morphism
$\Hom_{D(\mc A)}(X , Y)$ in $D(\mc A)$ is a roof $(t,f)$ where $t:
\cx Z \to \cx  X$ is a quasi-isomorphism and $f: \cx Z \to \cx Y $
is a morphism in $\mc K (\mc A)$. Then in this setting, a
quasi-isomorphism $s: \cx X \to \cx Y$ has inverse $(s, \id_X) \in
\Hom_{D(\mc A)}(\cx Y, \cx X)$.

Derived category has the universal property that  any functor $F:
Kom(\mc A) \to \mc D$ sending quasi-isomorphism into isomorphism
can be uniquely factored through $D(\mc A)$.

Note that a cohomology (homology) theory  on $\mc A$ is nothing
but a functor $F: Kom(\mc A) \to Kom(Ab)$ and thus factors through
derived category.

\end{document}
\end

