\documentclass[a4paper]{article}
\usepackage[unicode,colorlinks=true,linkcolor=blue]{hyperref}
% \usepackage{bookmark}
% \usepackage{parskip}
\usepackage{booktabs}
\usepackage{amssymb}

% It is possible to use 8-bit Greek text fonts in the LGR TeX font encoding
% also with XeTeX/LuaTeX, if the »fontenc« package is loaded before
% »fontspec« and »textalpha«:
\usepackage[LGR]{fontenc}

% Unicode font setup:
\usepackage{fontspec}
% \setmainfont{DejaVu Serif}
% \setsansfont{DejaVu Sans}
% \usepackage{libertineotf}
% \setmainfont{Linux Libertine O}
\setsansfont{Linux Biolinum O}
% \setmainfont{cmunrm.otf} % CMU Serif % many missing characters :(
\setmainfont{FreeSerif}%
% \setmainfont{Droid Sans}

% Declare the font encoding and Greek LICR definitions:
\usepackage[normalize-symbols]{textalpha}

% For the new \MakeUppercase, we need to set the text language to Greek
% with Babel or polyglossia:
\usepackage[greek,english]{babel}

% select the LGR font encoding and CB fonts
\providecommand*{\lgrfont}[1]{\leavevmode{%
  \fontfamily{cmr}\fontencoding{LGR}\selectfont#1}%
}

\newcommand{\pkgref}[1]{\emph{\href{https://ctan.org/pkg/#1}{#1}}}


\begin{document}

\title{Font setup for Greek with XeTeX/LuaTeX}
\author{Günter Milde}
\date{2020/10/30}
\maketitle

\noindent The file \href{tuenc-greek.def.html}{tuenc-greek.def} provides
support for Greek \hyperref[licr]{LICR} macros and upcasing of text with
XeTeX and LuaTeX. It is loaded automatically by
\href{textalpha-doc.pdf}{\emph{textalpha}},
\href{alphabeta-doc.pdf}{\emph{alphabeta}},
and \pkgref{babel-greek} when used with Unicode fonts
(LuaTeX or XeTeX with \pkgref{fontspec}).

\tableofcontents

\section{Requirements}

\subsection{\emph{fontspec} and suitable Unicode fonts}

LaTeX sets up the TU Unicode text font encoding if it detects the XeTeX or
LuaTeX engines. The user must ensure that the selected font contains Greek
glyphs (the default Latin Modern fonts have only capital Greek letters).
\textbf{There are no errors for missing glyphs}, just warnings in the log
file (but not in the console output) and empty spaces in the output
document.

The \pkgref{fontspec} package is the standard tool to select fonts in
XeTeX/LuaTeX. \pkgref{babel} provides a front-end to set
up language-specific fonts with the \verb|\babelfont| command.

\section{Usage}

\texttt{tuenc-greek.def} is loaded automatically by
\href{textalpha-doc.pdf}{\emph{textalpha}},
\href{alphabeta-doc.pdf}{\emph{alphabeta}}, or \pkgref{Babel} (with the
language option \href{https://ctan.org/pkg/babel-greek}{greek}) if these
packages are used with Unicode-aware TeX engines (XeTeX or LuaTeX). This
provides support for Greek LICR input and fixes for MakeUppercase.
The \verb|\MakeUppercase| implementation introduced in the 2022/06 LaTeX
release uses Greek upcasing rules only for text parts with the
\pkgref{babel} language \texttt{greek} and ignores the changes to
\texttt{uccode} values done in this package.


\section{LICR input%
         \label{licr}}

The LaTeX internal character representation (LICR) is a verbose,
fail-safe 7-bit ASCII encoding that can be used unaltered under both, 8-bit
TeX and XeTeX/LuaTeX. Use cases are macro definitions and generated text.

See the source of this document,
\href{test-tuenc-greek.tex}{\texttt{test-tuenc-greek.tex}} for the input used
in the examples below.

\subsection{Greek alphabet}

Greek letters via LICR macros:
\begin{quote}
  \textAlpha{} \textBeta{} \textGamma{} \textDelta{} \textEpsilon{}
  \textZeta{} \textEta{} \textTheta{} \textIota{} \textKappa{}
  \textLambda{} \textMu{} \textNu{} \textXi{} \textOmicron{} \textPi{}
  \textRho{} \textSigma{} \textTau{} \textUpsilon{} \textPhi{}
  \textChi{} \textPsi{} \textOmega{}

  \textalpha{} \textbeta{} \textgamma{} \textdelta{} \textepsilon{}
  \textzeta{} \texteta{} \texttheta{} \textiota{} \textkappa{}
  \textlambda{} \textmu{} \textnu{} \textxi{} \textomicron{} \textpi{}
  \textrho{} \textsigma{} \texttau{} \textupsilon{}
  \textphi{} \textchi{} \textpsi{} \textomega{}
\end{quote}
The small sigma is set with a different
glyph if it ends a word:
\begin{quote}
  \textsigma{}       \verb|\textsigma|\\
  \textfinalsigma{}  \verb|\textfinalsigma| or \verb|\textvarsigma|
\end{quote}
The \verb|\textautosigma| currently works only with 8-bit LGR fonts:
\textautosigma\textiota{} vs. \textiota\textautosigma.


\subsection{Diacritics}

Greek diacritics can be input by named macro or symbol macro:
\begin{quote}
  \acctonos\textalpha       \'\textalpha{}  \acctonos       x\'x
  \accvaria\textalpha       \`\textalpha{}  \accvaria       x\`x
  \accdialytika\textiota    \"\textiota{}   \accdialytika   x\"x
  \accperispomeni\textalpha \~\textalpha{}  \accperispomeni x\~x
  \accpsili\textalpha       \>\textalpha{}  \accpsili       x\>x
  \accdasia\textalpha       \<\textalpha{}  \accdasia       x\<x
\end{quote}
%
XeTeX and LuaTeX (since 2022) normalise base letter and combining diacritics
to the corresponding pre-composed character (if such character exists in the
\emph{Greek and Coptic} or \emph{Greek Extended} Unicode Blocks).


\begin{quote}
  % άάὰὰϊϊᾶᾶἀἀἁἁ
  \acctonos α       \'α
  \accvaria α       \`α
  \accdialytika ι   \"ι
  \accperispomeni α \~α
  \accpsili α       \>α
  \accdasia α       \<α
\end{quote}

\subsubsection{perispomeni vs. tilde}

The Greek \emph{perispomeni} has the look of a tilde but the semantic of
a circumflex accent. The Unicode standard provides distinct code points.
Only <Greek letter> + COMBINING GREEK PERISPOMENI is considered equivalent
to the pre-composed character <Greek letter> WITH PERISPOMENI.

The ``named'' \verb|\accperispomeni| macro uses COMBINING GREEK PERISPOMENI,
while the standard tilde-accent macro \verb|\~| uses the COMBINING TILDE.
Composite definitions for \verb|\~| select the pre-composed character:

\begin{quote}
  \~α = ᾶ, \~η = ῆ, \~ι = ῖ, \~υ = ῦ, \~ω = ῶ
\end{quote}


\subsubsection{combined diacritics}

Combined accents are defined using combining diacritical characters.

\begin{quote}
\accdialytikatonos\textiota{}     \"'\textiota{} \"\'\textiota{}
\accdialytikatonos x              \"'x           \"\'x
\accdialytikavaria\textiota{}     \"`\textiota{} \"\`\textiota{}
\accdialytikavaria x              \"`x           \"\`x
\accdialytikaperispomeni\textiota{} \~"\textiota{} \~\"\textiota{}
\accdialytikaperispomeni x        \~"x           \~\"x

\accdasiaoxia\textiota{}          \<'\textiota{} \<\'\textiota{}
\accdasiaoxia x                   \<'x           \<\'x
\accdasiavaria\textiota{}         \<`\textiota{} \<\`\textiota{}
\accdasiavaria x                  \<`x           \<\`x
\accdasiaperispomeni\textiota{}   \~<\textiota{} \~\<\textiota{}
\accdasiaperispomeni x            \~<x           \~\<x

\accpsilioxia\textiota{}          \>'\textiota{} \>\'\textiota{}
\accpsilioxia x                   \>'x           \>\'x
\accpsilivaria\textiota{}         \>`\textiota{} \>\`\textiota{}
\accpsilivaria x                  \>`x           \>\`x
\accpsiliperispomeni\textiota{}   \~>\textiota{} \~\>\textiota{}
\accpsiliperispomeni x            \~>x           \~\>x
\end{quote}
Composite diacritics overlap when they are not normalised to a pre-composed
character. However, this is not a major problem in normal use as
pre-composed characters exist in Unicode for all letters that are
used with diacritics in (ancient, polytonic or monotonic) Greek.

\subsubsection{sub-iota}

The sub-iota is input after the base letter.

\begin{itemize}
\item
  \verb|\ypogegrammeni| sets a COMBINING GREEK YPOGEGRAMMENI:
  \textalpha\ypogegrammeni{} k\ypogegrammeni{}.

  A Greek capital letter followed by COMBINING GREEK YPOGEGRAMMENI is
  normalised to the corresponding Greek capital letter WITH [... AND]
  PROSGEGRAMMENI, if a mapping exists in the Unicode standard (by XeTeX but
  not by LuaTeX)

\item \verb|\prosgegrammeni| sets a spacing GREEK PROSGEGRAMMENI:
  \textAlpha\prosgegrammeni{} K\prosgegrammeni{}.

  Spacing is better with the pre-composed characters for Greek capital
  letters \ldots{} WITH PROSGEGRAMMENI.

  Compare Αι (small letter iota) vs. Αι (spacing prosgegrammeni) vs. ᾼ
  (pre-composed).


\end{itemize}
%
Test letters with ypogegrammeni and prosgegrammeni (literal/LICR):

\begin{quote}
 % TODO: infinite recursion with new \MakeUppercase
 % \ifdefined\extrasgreek
 %   \selectlanguage{greek}
 % \fi
 \begin{tabbing}
  unchanged \quad\=  make lowercase\quad\=  make uppercase. \\

  ᾳαι/\textalpha\ypogegrammeni \textalpha\prosgegrammeni{} \>
  \MakeLowercase{ᾳαι/\textalpha\ypogegrammeni \textalpha\prosgegrammeni} \>
  \MakeUppercase{ᾳαι/\textalpha\ypogegrammeni \textalpha\prosgegrammeni} \\

  ᾼΑι/\textAlpha\ypogegrammeni \textAlpha\prosgegrammeni{} \>
  \MakeLowercase{ᾼΑι/\textAlpha\ypogegrammeni \textAlpha\prosgegrammeni} \>
  \MakeUppercase{ᾼΑι/\textAlpha\ypogegrammeni \textAlpha\prosgegrammeni} \\

  ΛͅΛι/\textLambda\ypogegrammeni \textLambda\prosgegrammeni{} \>
  \MakeLowercase{ΛͅΛι/\textLambda\ypogegrammeni \textLambda\prosgegrammeni} \>
  \MakeUppercase{ΛͅΛι/\textLambda\ypogegrammeni \textLambda\prosgegrammeni}

 \end{tabbing}
\end{quote}

\subsection{Additional Greek symbols}

\subsubsection{symbols for Greek numbers}

\begin{quote}
\raggedright
\textkoppa{}      textkoppa                 \\ % ϟ
\textKoppa{}      textKoppa                 \\ % Ϟ
\textqoppa{}      textqoppa (archaic koppa) \\ % ϙ
\textQoppa{}      textQoppa (archaic Koppa) \\ % Ϙ
\textstigma{}     textstigma                \\ % ϛ
% \textvarstigma{}  textvarstigma \\ % no separate Unicode character
\textStigma{}     textStigma (Sigma-Tau-Ligature in CB-fonts)%
\footnote{the name “stigma” originally applied to a medieval sigma-tau
         ligature, whose shape was confusingly similar to the cursive
         digamma}                           \\ % Ϛ
\textsampi{}      textsampi                 \\ % ϡ
\textSampi{}      textSampi                 \\ % Ϡ
\textdigamma{}    textdigamma               \\ % ϝ (\digamma used by amsmath!)
\textDigamma{}    textDigamma               \\ % Ϝ
% numeral signs: http://en.wikipedia.org/wiki/Greek_numerals
\textdexiakeraia{}    textdexiakeraia       \\ % ʹ
\textaristerikeraia{} textaristerikeraia    \\ % ͵
\end{quote}

\subsubsection{symbol variants}

Mathematical notation uses variant shapes of some Greek letters as
additional symbols. The variations have no syntactic meaning in Greek text
and text fonts may use the variant shapes in place of the “regular” ones as
a stylistic choice.

Unicode defines separate code points for the symbol variants. TeX supports
some of the variant shape symbols in mathematical mode, but its concept of
“standard” vs. “variant” symbols differs from the distinction between
“GREEK LETTER ...” vs. “GREEK ... SYMBOL” in the Unicode standard (see
Table \ref{tab:symbol-variants}).

\begin{table}[tbp]
  \centering
  \begin{tabular}{cccc}
  \hline
  \multicolumn{2}{c}{TeX math} & \multicolumn{2}{c}{Unicode} \\
  symbol & var symbol & “letter” & “symbol” \\
  \hline
  $\pi$      & $\varpi$       & π & ϖ \\
  $\rho$     & $\varrho$      & ρ & ϱ \\
  $\theta$   & $\vartheta$    & θ & ϑ \\
  \hline
  $\epsilon$ & $\varepsilon$  & ε & ϵ \\
  $\phi$     & $\varphi$      & φ & ϕ \\
  \hline
  $\beta$    & \emph{missing} & β & ϐ \\
  $\kappa$   & \emph{missing} & κ & ϰ \\
  $\Theta$   & \emph{missing} & Θ & ϴ \\
  \hline
  \end{tabular}
  \caption{Greek symbol variants in TeX and Unicode}
  \label{tab:symbol-variants}
\end{table}

\texttt{tuenc-greek.def} defines three TextCommands for each of these
letters:
\begin{quote}
  \verb|\text<name>| selects the Unicode GREEK LETTER ... variant,

  \verb|\text<name>symbol| selects the Unicode
     GREEK ... SYMBOL variant,

  \verb|\textvar<name>| selects the variant
    shape according to TeX' mathematical mode
\end{quote}
See Table \ref{tab:symbol-variant-macros} for the full list. The
\href{alphabeta-doc.pdf}{\emph{alphabeta}} package defines short macros that
work in text and math mode.

\begin{table}[tbp]
  \centering
  \begin{tabular}{lclc}
  \hline
  \multicolumn{2}{c}{text} & \multicolumn{2}{c}{mathematics} \\
  macro & output & macro & output \\
  \hline
  \verb$\textbeta$          & \textbeta          & \verb$\beta$       & $\beta$       \\
  \verb$\textvarbeta$       & \textvarbeta       & \emph{missing}     & \\
  \verb$\textbetasymbol$    & \textbetasymbol    &                    & \\
  \hline
  \verb$\textepsilon$       & \textepsilon       & \verb$\epsilon$    & $\epsilon$    \\
  \verb$\textvarepsilon$    & \textvarepsilon    & \verb$\varepsilon$ & $\varepsilon$ \\
  \verb$\textepsilonsymbol$ & \textepsilonsymbol &                    & \\
  \hline
  \verb$\texttheta$         & \texttheta         & \verb$\theta$      & $\theta$      \\
  \verb$\textvartheta$      & \textvartheta      & \verb$\vartheta$   & $\vartheta$   \\
  \verb$\textthetasymbol$   & \textthetasymbol   &                    & \\
  \hline
  \verb$\textTheta$         & \textTheta         & \verb$\Theta$      & $\Theta$      \\
  \verb$\textvarTheta$      & \textvarTheta      & \emph{missing}     & \\
  \verb$\textThetasymbol$   & \textThetasymbol   &                    & \\
  \hline
  \verb$\textkappa$         & \textkappa         & \verb$\kappa$      & $\kappa$      \\
  \verb$\textvarkappa$      & \textvarkappa      & \verb$\varkappa$   & $\varkappa$   \\
  \verb$\textkappasymbol$   & \textkappasymbol   &                    & \\
  \hline
  \verb$\textpi$            & \textpi            & \verb$\pi$         & $\pi$         \\
  \verb$\textvarpi$         & \textvarpi         & \verb$\varpi$      & $\varpi$      \\
  \verb$\textpisymbol$      & \textpisymbol      &                    & \\
  \hline
  \verb$\textrho$           & \textrho           & \verb$\rho$        & $\rho$        \\
  \verb$\textvarrho$        & \textvarrho        & \verb$\varrho$     & $\varrho$     \\
  \verb$\textrhosymbol$     & \textrhosymbol     &                    & \\
  \hline
  \verb$\textphi$           & \textphi           & \verb$\phi$        & $\phi$        \\
  \verb$\textvarphi$        & \textvarphi        & \verb$\varphi$     & $\varphi$     \\
  \verb$\textphisymbol$     & \textphisymbol     &                    & \\
  \hline
  \end{tabular}
  \caption{Macros for Greek symbol variants}
  \label{tab:symbol-variant-macros}
\end{table}

\subsubsection{Ancient Greek Numbers}

Ancient Greek Numbers are missing in most fonts (including Libertine and
Deja Vu). The “FreeSerif” font works fine:
\begin{quote}
\textpentedeka    % GREEK ACROPHONIC ATTIC FIFTY
\textpentehekaton % GREEK ACROPHONIC ATTIC FIVE HUNDRED
\textpenteqilioi  % GREEK ACROPHONIC ATTIC FIVE THOUSAND
\textpentemuria   % GREEK ACROPHONIC ATTIC FIFTY THOUSAND
\end{quote}
If the LGR font encoding is loaded via «fontenc» in the document preamble,
Ancient Greek Numbers (as well as any other character) from LGR encoded
8-bit TeX fonts can be used after a font-encoding switch. (This document
defines the \verb|\lgrfont| command for this purpose in the preamble.)
\begin{quote}
\lgrfont{
\textpentedeka    % GREEK ACROPHONIC ATTIC FIFTY
\textpentehekaton % GREEK ACROPHONIC ATTIC FIVE HUNDRED
\textpenteqilioi  % GREEK ACROPHONIC ATTIC FIVE THOUSAND
\textpentemuria   % GREEK ACROPHONIC ATTIC FIFTY THOUSAND
}
\end{quote}


\subsubsection{generic text symbols}

There are some LICR macros for some symbols from the 8-bit font encoding LGR
that are not confined to Greek but not defined in
\texttt{tuenc.def} [2018/08/11 v2.0j].

\begin{quote}
  \textsemicolon{} textsemicolon\\
  \textmicro{} textmicro \\
  \textschwa{} textschwa
\end{quote}
The SI unit prefix MICRO SIGN is not upcased with MakeUppercase:

\begin{quote}
  textmu: \textmu{} $\mapsto$ \MakeUppercase{\textmu} but
  textmicro: \textmicro{} $\mapsto$ \MakeUppercase{\textmicro}.
\end{quote}


\section{Latin transliteration}

The Latin transliteration known from LGR encoded 8-bit fonts%
\footnote{See the \pkgref{teubner} package or the file usage.pdf from
          \pkgref{babel-greek} for a description.}
does not work with Unicode fonts.

For LuaTeX, there is a \texttt{transliteration.omega} \emph{transform} that
applies the transliteration system devised by Yannis Haralambous for the
Omega system (cf. the Babel documentation for the
\href{https://latex3.github.io/babel/guides/locale-greek.html}{Greek locale}).

It is possible to set up LGR encoded fonts parallel to Unicode fonts (see
the preamble of the source file \url{test-tuenc-greek.tex} for an example).
After switching the font encoding to LGR, Greek letters can be input
via a \emph{Latin transliteration}, e.g. «logos» becomes «\lgrfont{logos}»
and «\verb|>aupn\'ia|» becomes «\lgrfont{>aupn\'ia}».

Mark that you cannot use Unicode input with LGR encoded fonts except when
running in 8-bit compatibility mode.
LICR macros work in both, TU and LGR: compare
\>\textIota\textalpha\textnu\textomicron\textupsilon\textalpha
\textrho\acctonos\textiota\textomicron\textupsilon{} (TU) vs.
\lgrfont{\>\textIota\textalpha\textnu\textomicron\textupsilon\textalpha
         \textrho\acctonos\textiota\textomicron\textupsilon} (LGR).


\section{UPPERCASE and lowercase}

According to Greek typesetting conventions, Greek diacritics (except the
dialytika and sub-iota) are placed to the left (instead of above) capital
letters and dropped if text is set in ALL CAPS, e.g. \ensuregreek{μαΐστρος
$\mapsto$ \MakeUppercase{μαΐστρος}}. The macron and breve accents are
handled as in Latin texts.

The new \verb|\MakeUppercase| implementation (rolled out in the
\href{https://www.latex-project.org/news/latex2e-news/ltnews35.pdf}
{June 2022 LaTeX release}) relies on Unicode data. It upcases according to
the Greek conventions \textbf{if the text language is set to Greek} with
\pkgref{babel} or \pkgref{polyglossia}.

For the pre-2022/06 implementation, \texttt{tuenc-greek.def} contains code
to get the same effect.
The uccode/lccode corrections (taken from Apostolos Syropoulos xgreek
package) ensure dropping of accents with \verb|\MakeUppercase| for literal
Unicode characters.

@uclclist additions ensure that upcasing also drops Greek diacritics.
However, when the tonos, varia, and perispomeni accents
are input using the symbol macros (\verb|\' \` \~|), this does not work, as
they cannot be distinguished from Latin acute, grave, and tilde accents.%
If these accents should be dropped by MakeUppercase, they must be input as
named macro:

\begin{quote}
  \ifdefined\extrasgreek
    \selectlanguage{greek}
  \fi
  \acctonos\textalpha\'\textalpha{}  \acctonos a\'a
  \accvaria\textalpha\`\textalpha{}  \accvaria a\`a
  $\mapsto$
  \MakeUppercase{
  \acctonos\textalpha\'\textalpha{}  \acctonos a\'a
  \accvaria\textalpha\`\textalpha{}  \accvaria a\`a
  }
\end{quote}

\subsection{hiatus}

Tonos and psili mark a \emph{hiatus} (break-up of a diphthong) if placed on
the first of two consecutive vowels (άι, άυ, έι, ἀυ, ἄι, ἄυ, ἔι).
A dialytika must be placed on the second vowel if they are dropped.

The «hiatus» feature works with macro input:
\begin{quote}
  % from teubner: άυλος/ΑΫΛΟΣ
  \acctonos\textalpha\textupsilon λος $\mapsto$
  \MakeUppercase{\acctonos\textalpha\textupsilon λος},
  \accpsilioxia\textalpha\textupsilon λος $\mapsto$
  \MakeUppercase{\accpsilioxia\textalpha\textupsilon λος},

  % from http://diacritics.typo.cz/index.php?id=69  μάινα -> ΜΑΪΝΑ
  m\acctonos\textalpha\textiota να $\mapsto$
  \MakeUppercase{m\acctonos\textalpha\textiota να},
  % from  http://de.wikipedia.org/wiki/Neugriechische_Orthographie#Das_Trema
  % κέικ, ἀυπνία/αϋπνία
  \textkappa\acctonos\textepsilon\textiota\textkappa $\mapsto$
  \MakeUppercase{\textkappa\acctonos\textepsilon\textiota\textkappa},
  \accpsili\textalpha\textupsilon πνία $\mapsto$
  \MakeUppercase{\accpsili\textalpha\textupsilon πνία}.
\end{quote}

Since the 2022/06 LaTeX release, it works with monotonic Unicode literals
(since 2023/02/10 also some polytonic)
\begin{quote}
  \ifdefined\extrasgreek
    \selectlanguage{greek}
  \fi
  \newcommand*{\hiatest}{άι, άυ, έι, ἄι, ἄυ, ἔι, ἀυ}
  \hiatest{} $\mapsto$ \MakeUppercase{\hiatest}
\end{quote}
but not with the named accent-macro + Unicode literals
\begin{quote}
  \ifdefined\extrasgreek
    \selectlanguage{greek}
  \fi
  \newcommand*{\hiatest}{
    \acctonos αι, \acctonos αυ, \acctonos ει,
    \accpsilioxia αι, \accpsilioxia αυ, \accpsilioxia ει, \accpsili αυ}
  \hiatest{} $\mapsto$ \MakeUppercase{\hiatest}
\end{quote}
nor with short accent-macro + Unicode literals (yet?)
\begin{quote}
  \ifdefined\extrasgreek
    \selectlanguage{greek}
  \fi
  \newcommand*{\hiatest}{
    \'αι, \'αυ, \'ει, \'>αι, \'>αυ, \'>ει, \>αυ}
  \hiatest{} $\mapsto$ \MakeUppercase{\hiatest}
\end{quote}

\section{Character Tables}

The following tables list the Greek Unicode characters. In the input, the
LICR macro is followed by the corresponding literal Unicode character.

\subsection{Greek and Coptic Unicode block}

Only characters that are supported by LGR encoded TeX fonts have a LICR
definition.

\newcommand{\greekandcoptic}{
% NR    Unicode Name                                       %   babel name, UCS name
% 0370  GREEK CAPITAL LETTER HETA                          % Ͱ
% 0371  GREEK SMALL LETTER HETA                            % ͱ
% 0372  GREEK CAPITAL LETTER ARCHAIC SAMPI                 % Ͳ
% 0373  GREEK SMALL LETTER ARCHAIC SAMPI                   % Ͳ
\textnumeralsigngreek ʹ % \anwtonos, \textdexiakeraia
\textnumeralsignlowergreek ͵ % \katwtonos, \textaristerikeraia,
% 0376  GREEK CAPITAL LETTER PAMPHYLIAN DIGAMMA            % Ͷ
% 0377  GREEK SMALL LETTER PAMPHYLIAN DIGAMMA              % ͷ
{ }\ypogegrammeni ͺ % \textsubiota{\empty}
% 037B  GREEK SMALL REVERSED LUNATE SIGMA SYMBOL           %
% 037C  GREEK SMALL DOTTED LUNATE SIGMA SYMBOL             %
% 037D  GREEK SMALL REVERSED DOTTED LUNATE SIGMA SYMBOL    %
\texterotimatiko ; % \textquestion

\acctonos{ } ΄
\"'{ } ΅
\'\textAlpha Ά
\textanoteleia · % \anoteleia, 00B7 (middle dot) is the preferred character
\'\textEpsilon Έ
\'\textEta Ή
\'\textIota Ί
\'\textOmicron Ό
\'\textUpsilon Ύ
\'\textOmega Ώ

\'"\textiota ΐ
\textAlpha Α
\textBeta Β
\textGamma Γ
\textDelta Δ
\textEpsilon Ε
\textZeta Ζ
\textEta Η
\textTheta Θ
\textIota Ι
\textKappa Κ
\textLambda Λ
\textMu Μ
\textNu Ν
\textXi Ξ
\textOmicron Ο

\textPi Π
\textRho Ρ
\textSigma Σ
\textTau Τ
\textUpsilon Υ
\textPhi Φ
\textChi Χ
\textPsi Ψ
\textOmega Ω
\"\textIota Ϊ
\"\textUpsilon Ϋ
\'\textalpha ά
\'\textepsilon έ
\'\texteta ή
\'\textiota ί

\"'\textupsilon ΰ
\textalpha α
\textbeta β
\textgamma γ
\textdelta δ
\textepsilon ε
\textzeta ζ
\texteta η
\texttheta θ
\textiota ι
\textkappa κ
\textlambda λ
\textmu μ % \textmugreek
\textnu ν
\textxi ξ
\textomicron ο

\textpi π
\textrho ρ
\textfinalsigma ς
\textsigma σ
\texttau τ
\textupsilon υ
\textphi φ
\textchi χ
\textpsi ψ
\textomega ω
\"\textiota ϊ
\"\textupsilon ϋ
\'\textomicron ό
\'\textupsilon ύ
\'\textomega ώ

\textbetasymbol ϐ
\textthetasymbol ϑ
% ϒ ϓ ϔ
\textphisymbol ϕ
\textpisymbol ϖ %ϗ

\textQoppa Ϙ
\textqoppa ϙ
\textStigma Ϛ
\textstigma ϛ
\textDigamma Ϝ
\textdigamma ϝ
\textKoppa Ϟ % \textKoppagreek
\textkoppa ϟ % \koppa, \textqoppa [sic!]

\textSampi Ϡ
\textsampi ϡ

% Ϣ ϣ Ϥ ϥ Ϧ ϧ Ϩ ϩ Ϫ ϫ Ϭ ϭ Ϯ ϯ

\textkappasymbol ϰ
\textrhosymbol ϱ
% ϲ
% ϳ
\textThetasymbol ϴ
\textepsilonsymbol ϵ
% ϶
% Ϸ ϸ
% Ϲ
% Ϻ ϻ ϼ
% Ͻ Ͼ Ͽ
}

\greekandcoptic

\noindent MakeUppercase (TODO: standard accents not dropped, accents from
pre-composed characters dropped since 2022/06, if the text language is set
to Greek):

\foreignlanguage{greek}{
  \MakeUppercase{\greekandcoptic}
}

TODO: Alias \verb|\textvarsigma| not upcased with new MakeUppercase:
\foreignlanguage{greek}{
  \textvarsigma ς → \MakeUppercase{\textvarsigma ς}
}

\noindent MakeLowercase:

\foreignlanguage{greek}{
  \MakeLowercase{\greekandcoptic}
}

\noindent
The lowercase of ΣΣ is \MakeLowercase{ΣΣ}.\footnote{%
  With LaTeX versions since 2022/06,
  the final sigma is used if the algorithm detects the end of a word.}


\subsection{Greek Extended Unicode block}

Note: There are no LICR definitions for spacing diacritical characters.
Use the corresponding accent macro with an empty argument or a space.

\medskip

\newcommand{\greekextended}{
\>\textalpha   ἀ
\<\textalpha   ἁ
\>`\textalpha  ἂ
\<`\textalpha  ἃ
\>'\textalpha  ἄ
\<'\textalpha  ἅ
\~>\textalpha  ἆ
\~<\textalpha  ἇ
\>\textAlpha   Ἀ
\<\textAlpha   Ἁ
\>`\textAlpha  Ἂ
\<`\textAlpha  Ἃ
\>'\textAlpha  Ἄ
\<'\textAlpha  Ἅ
\~>\textAlpha  Ἆ
\~<\textAlpha  Ἇ

\>\textepsilon   ἐ
\<\textepsilon   ἑ
\>`\textepsilon  ἒ
\<`\textepsilon  ἓ
\>'\textepsilon  ἔ
\<'\textepsilon  ἕ
\>\textEpsilon   Ἐ
\<\textEpsilon   Ἑ
\>`\textEpsilon  Ἒ
\<`\textEpsilon  Ἓ
\>'\textEpsilon  Ἔ
\<'\textEpsilon  Ἕ

\>\texteta   ἠ
\<\texteta   ἡ
\>`\texteta  ἢ
\<`\texteta  ἣ
\>'\texteta  ἤ
\<'\texteta  ἥ
\~>\texteta  ἦ
\~<\texteta  ἧ
\>\textEta   Ἠ
\<\textEta   Ἡ
\>`\textEta  Ἢ
\<`\textEta  Ἣ
\>'\textEta  Ἤ
\<'\textEta  Ἥ
\~>\textEta  Ἦ
\~<\textEta  Ἧ

\>\textiota   ἰ
\<\textiota   ἱ
\>`\textiota  ἲ
\<`\textiota  ἳ
\>'\textiota  ἴ
\<'\textiota  ἵ
\~>\textiota  ἶ
\~<\textiota  ἷ
\>\textIota   Ἰ
\<\textIota   Ἱ
\>`\textIota  Ἲ
\<`\textIota  Ἳ
\>'\textIota  Ἴ
\<'\textIota  Ἵ
\~>\textIota  Ἶ
\~<\textIota  Ἷ

\>\textomicron   ὀ
\<\textomicron   ὁ
\>`\textomicron  ὂ
\<`\textomicron  ὃ
\>'\textomicron  ὄ
\<'\textomicron  ὅ
\>\textOmicron   Ὀ
\<\textOmicron   Ὁ
\>`\textOmicron  Ὂ
\<`\textOmicron  Ὃ
\>'\textOmicron  Ὄ
\<'\textOmicron  Ὅ

\>\textupsilon   ὐ
\<\textupsilon   ὑ
\>`\textupsilon  ὒ
\<`\textupsilon  ὓ
\>'\textupsilon  ὔ
\<'\textupsilon  ὕ
\~>\textupsilon  ὖ
\~<\textupsilon  ὗ
\<\textUpsilon   Ὑ
\<`\textUpsilon  Ὓ
\<'\textUpsilon  Ὕ
\~<\textUpsilon  Ὗ

\>\textomega   ὠ
\<\textomega   ὡ
\>`\textomega  ὢ
\<`\textomega  ὣ
\>'\textomega  ὤ
\<'\textomega  ὥ
\~>\textomega  ὦ
\~<\textomega  ὧ
\>\textOmega   Ὠ
\<\textOmega   Ὡ
\>`\textOmega  Ὢ
\<`\textOmega  Ὣ
\>'\textOmega  Ὤ
\<'\textOmega  Ὥ
\~>\textOmega  Ὦ
\~<\textOmega  Ὧ

\accvaria\textalpha   ὰ
\accoxia\textalpha    ά
\accvaria\textepsilon ὲ
\accoxia\textepsilon  έ
\accvaria\texteta     ὴ
\accoxia\texteta      ή
\accvaria\textiota    ὶ
\accoxia\textiota     ί
\accvaria\textomicron ὸ
\accoxia\textomicron  ό
\accvaria\textupsilon ὺ
\accoxia\textupsilon  ύ
\accvaria\textomega   ὼ
\accoxia\textomega    ώ

\>\textalpha\ypogegrammeni   ᾀ
\<\textalpha\ypogegrammeni   ᾁ
\>`\textalpha\ypogegrammeni  ᾂ
\<`\textalpha\ypogegrammeni  ᾃ
\>'\textalpha\ypogegrammeni  ᾄ
\<'\textalpha\ypogegrammeni  ᾅ
\~>\textalpha\ypogegrammeni  ᾆ
\~<\textalpha\ypogegrammeni  ᾇ
\>\textAlpha\ypogegrammeni   ᾈ
\<\textAlpha\ypogegrammeni   ᾉ
\>`\textAlpha\ypogegrammeni  ᾊ
\<`\textAlpha\ypogegrammeni  ᾋ
\>'\textAlpha\ypogegrammeni  ᾌ
\<'\textAlpha\ypogegrammeni  ᾍ
\~>\textAlpha\ypogegrammeni  ᾎ
\~<\textAlpha\ypogegrammeni  ᾏ

\>\texteta\ypogegrammeni     ᾐ
\<\texteta\ypogegrammeni     ᾑ
\>`\texteta\ypogegrammeni    ᾒ
\<`\texteta\ypogegrammeni    ᾓ
\>'\texteta\ypogegrammeni    ᾔ
\<'\texteta\ypogegrammeni    ᾕ
\~>\texteta\ypogegrammeni    ᾖ
\~<\texteta\ypogegrammeni    ᾗ
\>\textEta\ypogegrammeni     ᾘ
\<\textEta\ypogegrammeni     ᾙ
\>`\textEta\ypogegrammeni    ᾚ
\<`\textEta\ypogegrammeni    ᾛ
\>'\textEta\ypogegrammeni    ᾜ
\<'\textEta\ypogegrammeni    ᾝ
\~>\textEta\ypogegrammeni    ᾞ
\~<\textEta\ypogegrammeni    ᾟ

\>\textomega\ypogegrammeni   ᾠ
\<\textomega\ypogegrammeni   ᾡ
\>`\textomega\ypogegrammeni  ᾢ
\<`\textomega\ypogegrammeni  ᾣ
\>'\textomega\ypogegrammeni  ᾤ
\<'\textomega\ypogegrammeni  ᾥ
\~>\textomega\ypogegrammeni  ᾦ
\~<\textomega\ypogegrammeni  ᾧ
\>\textOmega\ypogegrammeni   ᾨ
\<\textOmega\ypogegrammeni   ᾩ
\>`\textOmega\ypogegrammeni  ᾪ
\<`\textOmega\ypogegrammeni  ᾫ
\>'\textOmega\ypogegrammeni  ᾬ
\<'\textOmega\ypogegrammeni  ᾭ
\~>\textOmega\ypogegrammeni  ᾮ
\~<\textOmega\ypogegrammeni  ᾯ

\u\textalpha                      ᾰ
\=\textalpha                      ᾱ
\accvaria\textalpha\ypogegrammeni ᾲ
\textalpha\ypogegrammeni          ᾳ
\accoxia\textalpha\ypogegrammeni  ᾴ
\~\textalpha                      ᾶ
\~\textalpha\ypogegrammeni        ᾷ
\u\textAlpha                      Ᾰ
\=\textAlpha                      Ᾱ
\accvaria\textAlpha               Ὰ
\accoxia\textAlpha                Ά
\textAlpha\ypogegrammeni          ᾼ
\>{ }                             ᾽
{ }\prosgegrammeni                ι
\>{ }                             ᾿

\accperispomeni{ }                ῀
\"\~{ }                           ῁
\accvaria\texteta\ypogegrammeni   ῂ
\texteta\ypogegrammeni            ῃ
\accoxia\texteta\ypogegrammeni    ῄ
\~\texteta                        ῆ
\~\texteta\ypogegrammeni          ῇ
\accvaria\textEpsilon             Ὲ
\accoxia\textEpsilon              Έ
\accvaria\textEta                 Ὴ
\accoxia\textEta                  Ή
\textEta\ypogegrammeni            ῌ
\>`{ }                            ῍
\>'{ }                            ῎
\~>{ }                            ῏

\u\textiota                       ῐ
\=\textiota                       ῑ
\`"\textiota                      ῒ
\'"\textiota                      ΐ
\~\textiota                       ῖ
\~"\textiota                      ῗ
\u\textIota                       Ῐ
\=\textIota                       Ῑ
\accvaria\textIota                Ὶ
\accoxia\textIota                 Ί
  \<`{ }                          ῝
\>'{ }                            ῞
\~<{ }                            ῟

\u\textupsilon                    ῠ
\=\textupsilon                    ῡ
\`"\textupsilon                   ῢ
\'"\textupsilon                   ΰ
\>\textrho                        ῤ
\<\textrho                        ῥ
\~\textupsilon                    ῦ
\~"\textupsilon                   ῧ
\u\textUpsilon                    Ῠ
\=\textUpsilon                    Ῡ
\accvaria\textUpsilon             Ὺ
\accoxia\textUpsilon              Ύ
\<\textRho                        Ῥ
\`"{ }                            ῭
\'"{ }                            ΅
\accvaria{ }                      `

\accvaria\textomega\ypogegrammeni ῲ
\textomega\ypogegrammeni          ῳ
\accoxia\textomega\ypogegrammeni  ῴ
\~\textomega                      ῶ
\~\textomega\ypogegrammeni        ῷ
\accvaria\textOmicron             Ὸ
\accoxia\textOmicron              Ό
\accvaria\textOmega               Ὼ
\accoxia\textOmega                Ώ
\textOmega\ypogegrammeni          ῼ
\accoxia{ }                       ´
\<{ }                             ῾
}

\greekextended

\noindent MakeUppercase:

\foreignlanguage{greek}{
  \MakeUppercase{\greekextended}
}

\noindent MakeLowercase:

\foreignlanguage{greek}{
  \MakeLowercase{\greekextended}
}

\subsection{Character Tables: accent + literal base character}

With Xe/LuaTeX and Unicode fonts, diacritics may also be input using
accent macros on a literal Unicode base character.

\subsubsection{Greek and Coptic Unicode block}

\renewcommand{\greekandcoptic}{

\'ΑΆ \'ΕΈ \'ΗΉ \'ΙΊ \'ΟΌ \'ΥΎ \'ΩΏ

\"'ιΐ \"ΙΪ \"ΥΫ \'αά \'εέ \'ηή \'ιί

\"'υΰ

\"ιϊ \"υϋ \'οό \'υύ \'ωώ
}

Accented letters from the Greek and Coptic Unicode Block

\greekandcoptic

\noindent MakeUppercase:

\foreignlanguage{greek}{
  \MakeUppercase{\greekandcoptic}
}

\noindent MakeLowercase:

\foreignlanguage{greek}{
  \MakeLowercase{\greekandcoptic}
}

\subsubsection{Greek Extended Unicode block}


\renewcommand{\greekextended}{
\>αἀ \<αἁ \>`αἂ \<`αἃ \>'αἄ \<'αἅ \~>αἆ \~<αἇ
\>ΑἈ \<ΑἉ \>`ΑἊ \<`ΑἋ \>'ΑἌ \<'ΑἍ \~>ΑἎ \~<ΑἏ

\>εἐ \<εἑ \>`εἒ \<`εἓ \>'εἔ \<'εἕ
\>ΕἘ \<ΕἙ \>`ΕἚ \<`ΕἛ \>'ΕἜ \<'ΕἝ

\>ηἠ \<ηἡ \>`ηἢ \<`ηἣ \>'ηἤ \<'ηἥ \~>ηἦ \~<ηἧ
\>ΗἨ \<ΗἩ \>`ΗἪ \<`ΗἫ \>'ΗἬ \<'ΗἭ \~>ΗἮ \~<ΗἯ

\>ιἰ \<ιἱ \>`ιἲ \<`ιἳ \>'ιἴ \<'ιἵ \~>ιἶ \~<ιἷ
\>ΙἸ \<ΙἹ \>`ΙἺ \<`ΙἻ \>'ΙἼ \<'ΙἽ \~>ΙἾ \~<ΙἿ

\>οὀ \<οὁ \>`οὂ \<`οὃ \>'οὄ \<'οὅ
\>ΟὈ \<ΟὉ \>`ΟὊ \<`ΟὋ \>'ΟὌ \<'ΟὍ

\>υὐ \<υὑ \>`υὒ \<`υὓ \>'υὔ \<'υὕ \~>υὖ \~<υὗ
\<ΥὙ \<`ΥὛ \<'ΥὝ \~<ΥὟ

\>ωὠ \<ωὡ \>`ωὢ \<`ωὣ \>'ωὤ \<'ωὥ \~>ωὦ \~<ωὧ
\>ΩὨ \<ΩὩ \>`ΩὪ \<`ΩὫ \>'ΩὬ \<'ΩὭ \~>ΩὮ \~<ΩὯ

\`αὰ \'αά \`εὲ \'εέ \`ηὴ \'ηή \`ιὶ \'ιί \`οὸ \'οό \`υὺ \'υύ \`ωὼ \'ωώ

\>α\ypogegrammeni   ᾀ
\<α\ypogegrammeni   ᾁ
\>`α\ypogegrammeni  ᾂ
\<`α\ypogegrammeni  ᾃ
\>'α\ypogegrammeni  ᾄ
\<'α\ypogegrammeni  ᾅ
\~>α\ypogegrammeni  ᾆ
\~<α\ypogegrammeni  ᾇ
\>Α\ypogegrammeni   ᾈ
\<Α\ypogegrammeni   ᾉ
\>`Α\ypogegrammeni  ᾊ
\<`Α\ypogegrammeni  ᾋ
\>'Α\ypogegrammeni  ᾌ
\<'Α\ypogegrammeni  ᾍ
\~>Α\ypogegrammeni  ᾎ
\~<Α\ypogegrammeni  ᾏ

\>η\ypogegrammeni   ᾐ
\<η\ypogegrammeni   ᾑ
\>`η\ypogegrammeni  ᾒ
\<`η\ypogegrammeni  ᾓ
\>'η\ypogegrammeni  ᾔ
\<'η\ypogegrammeni  ᾕ
\~>η\ypogegrammeni  ᾖ
\~<η\ypogegrammeni  ᾗ
\>Η\ypogegrammeni   ᾘ
\<Η\ypogegrammeni   ᾙ
\>`Η\ypogegrammeni  ᾚ
\<`Η\ypogegrammeni  ᾛ
\>'Η\ypogegrammeni  ᾜ
\<'Η\ypogegrammeni  ᾝ
\~>Η\ypogegrammeni  ᾞ
\~<Η\ypogegrammeni  ᾟ

\>ω\ypogegrammeni   ᾠ
\<ω\ypogegrammeni   ᾡ
\>`ω\ypogegrammeni  ᾢ
\<`ω\ypogegrammeni  ᾣ
\>'ω\ypogegrammeni  ᾤ
\<'ω\ypogegrammeni  ᾥ
\~>ω\ypogegrammeni  ᾦ
\~<ω\ypogegrammeni  ᾧ
\>Ω\ypogegrammeni   ᾨ
\<Ω\ypogegrammeni   ᾩ
\>`Ω\ypogegrammeni  ᾪ
\<`Ω\ypogegrammeni  ᾫ
\>'Ω\ypogegrammeni  ᾬ
\<'Ω\ypogegrammeni  ᾭ
\~>Ω\ypogegrammeni  ᾮ
\~<Ω\ypogegrammeni  ᾯ

\u αᾰ \= αᾱ
\`α\ypogegrammeni ᾲ
α\ypogegrammeni   ᾳ
\'α\ypogegrammeni ᾴ
\~αᾶ
\~α\ypogegrammeni ᾷ
\u ΑᾸ \= ΑᾹ \`ΑᾺ \'ΑΆ
Α\ypogegrammeni ᾼ

\`η\ypogegrammeni ῂ
η\ypogegrammeni   ῃ
\'η\ypogegrammeni ῄ
\~ηῆ
\~η\ypogegrammeni ῇ
\`ΕῈ \'ΕΈ \`ΗῊ \'ΗΉ
Η\ypogegrammeni ῌ

\u ιῐ \=ιῑ \"`ιῒ \"'ιΐ \~ιῖ \"~ιῗ \u ΙῘ \= ΙῙ \`ΙῚ \'ΙΊ

\u υῠ \=υῡ \"`υῢ \'"υΰ \>ρῤ \<ρῥ \~υῦ \~"υῧ
\u ΥῨ \=ΥῩ \`ΥῪ \'ΥΎ \<ΡῬ

\`ω\ypogegrammeni ῲ
ω\ypogegrammeni   ῳ
\'ω\ypogegrammeni ῴ
\~ω               ῶ
\~ω\ypogegrammeni ῷ
\`ΟῸ \'ΟΌ \`ΩῺ \'ΩΏ
Ω\ypogegrammeni ῼ
}

Accented letters from the Greek Extended Unicode block

\greekextended


\medskip
\noindent MakeUppercase:

\foreignlanguage{greek}{
\MakeUppercase{\greekextended}
}

\medskip
\noindent MakeLowercase:

\foreignlanguage{greek}{
\MakeLowercase{\greekextended}
}
\end{document}
