%&LaTeX

\documentclass[reqno]{amsart}

\AtBeginDocument{{\noindent\small
{\em Electronic Journal of Differential Equations},
Vol. 2002(2002), No. 93, pp. 1--23.\newline
ISSN: 1072-6691. URL: http://ejde.math.swt.edu or http://ejde.math.unt.edu
\newline ftp ejde.math.swt.edu  (login: ftp)}
\thanks{\copyright 2002 Southwest Texas State University.}
\vspace{9mm}}

\begin{document}

\title[\hfilneg EJDE--2002/93\hfil A degenerate parabolic equation]
{On a nonlinear degenerate parabolic transport-diffusion equation
with a discontinuous coefficient}

\author[K. H. Karlsen, N. H. Risebro, \&  J. D. Towers\hfil EJDE--2002/93\hfilneg]
{Kenneth H. Karlsen, Nils H. Risebro, \&  John D. Towers }

\address{Kenneth H. Karlsen \newline
  Department of Mathematics,
  University of Bergen\newline
  Johs.\ Brunsgt.\ 12\newline
  N--5008 Bergen, Norway}
\email{kennethk@math.uib.no}
\urladdr{www.mi.uib.no/$\sim$kennethk}

\address{Nils H. Risebro\newline
  Department of Mathematics,
  University of Oslo\newline
  P.O.\ Box 1053, Blindern\newline
  N--0316 Oslo, Norway}
\email{nilshr@math.uio.no}
\urladdr{www.math.uio.no/$\sim$nilshr}

\address{John D. Towers\newline
MiraCosta College\newline
3333 Manchester Avenue \newline
Cardiff-by-the-Sea, CA 92007-1516, USA}
\email{jtowers@cts.com}
\urladdr{www.miracosta.cc.ca.us/home/jtowers/}


\date{}
\thanks{Submitted April 29, 2002. Published October 27, 2002.}
\subjclass[2000]{35K65, 35D05, 35R05, 35L80}
\keywords{Degenerate parabolic equation, nonconvex flux, weak solution,
\break\indent
discontinuous coefficient,  viscosity method,
a priori estimates, compensated compactness }

\begin{abstract}
   We study the Cauchy problem for
   the nonlinear (possibly strongly) degenerate
   parabolic transport-diffusion equation
   $$
   \partial_t  u + \partial_x \bigl(\gamma(x)f(u)\bigr)=\partial_x^2 A(u),
   \quad A'(\cdot)\ge 0,
   $$
   where the coefficient $\gamma(x)$ is possibly discontinuous and
   $f(u)$ is genuinely nonlinear, but not necessarily
   convex or concave. Existence of a weak solution is proved by
   passing to the limit as $\varepsilon\downarrow 0$ in a suitable
   sequence $\{u_{\varepsilon}\}_{\varepsilon>0}$ of
   smooth approximations solving the problem above with the transport
   flux $\gamma(x)f(\cdot)$ re\nolinebreak{}placed 
   by $\gamma_{\varepsilon}(x)f(\cdot)$
   and the diffusion function $A(\cdot)$ replaced by
   $A_{\varepsilon}(\cdot)$,
   where $\gamma_{\varepsilon}(\cdot)$ is smooth and
   $A_{\varepsilon}'(\cdot)>0$.
   The main technical challenge is to deal with the fact
   that the total variation $|u_{\varepsilon}|_{BV}$
   cannot be bounded uniformly in $\varepsilon$, and hence one
   cannot derive directly strong convergence of
   $\{u_{\varepsilon}\}_{\varepsilon>0}$. In the purely hyperbolic case
   ($A'\equiv 0$),  where existence has already been established by a
   number of authors,  all existence results to date have used a
   singular ma\nolinebreak{}pping to overcome the lack of a variation bound.
   Here we derive instead strong convergence via a series of
   a priori (energy) estimates that allow us to deduce convergence
   of the  diffusion function and use the  compensated compactness
   method to deal with the transport term.
\end{abstract}

\maketitle

\numberwithin{equation}{section}
\newcommand{\seq}[1]{\left\{#1\right\}}
\newcommand{\norm}[2]{\left\|#1\right\|_{#2}}
\newcommand{\abs}[1]{\left|#1\right|}

\newtheorem{theorem}{Theorem}[section]
\newtheorem*{theorem*}{Main Theorem}
\newtheorem{prop}[theorem]{Proposition}
\newtheorem{lemma}[theorem]{Lemma}
\newtheorem{definition}[theorem]{Definition}
\newtheorem{remark}[theorem]{Remark}
\numberwithin{equation}{section}
\allowdisplaybreaks

\section{Introduction}\label{sec:intro}

In this paper we prove existence of a weak solution
to the Cauchy problem for a
one-dimensional scalar degenerate parabolic equation
with a nonlinear transport term that depends
explicitly on the spatial position through a
coefficient $\gamma(x)$ that may be discontinuous. More precisely, the problem
that we study takes the form
\begin{equation}
   \label{eq:prob1}
   \begin{aligned}
      &\partial_t u + \partial_x  \bigl(\gamma(x)f(u)\bigr)
      =  \partial_x^2 A(u), \quad
      (x,t)\in \Pi_T=\mathbb{R}\times(0,T),\\
      &u(x,0)=u_{0}(x), \quad x\in \mathbb{R},
   \end{aligned}
\end{equation}
where $T>0$ is fixed, $u:\Pi_T\to \mathbb{R}$ is the unknown function that is sought,
and $\gamma,f,A,u_0$ are given functions.
Regarding $\gamma(\cdot)$, we
make the assumptions
\begin{equation}
   \label{gamma_ass}
   \text{$\underline{\gamma}\le \gamma(x)\le \overline{\gamma}$ for
   some constants $\underline{\gamma}$,
   $\overline{\gamma}$; $|\gamma(x)|>0$ a.e.~on $\mathbb{R}$;
   $\gamma\in BV(\mathbb{R})$.}
\end{equation}
In other words, the ``transport part'' of \eqref{eq:prob1} depends
explicitly on the spatial location and this dependency
may be discontinuous. Regarding the
function $f(\cdot)$, we assume that
\begin{equation}
   \label{f_ass}
      \text{$f \in C^2[0,1]$ with $f(0)=f(1)=0$;
            $f$ genuinely nonlinear,}
\end{equation}
but no convexity condition is assumed.
As usual, ``$f$ genuinely nonlinear'' means that there is no subinterval
of $[0,1]$ on which $f$ is linear.
We require that the diffusion function $A(\cdot)$ satisfies
\begin{equation}
    \label{A_ass}
    \text{$A(\cdot)\in C^2([0,1])$; $A(\cdot)$ nondecreasing with $A(0)=0$}.
\end{equation}
Finally, we assume that the initial function $u_0(\cdot)$
satisfies
\begin{equation}
   \label{unull_ass}
   \text{$u_0\in L^{\infty}(\mathbb{R})\cap L^1(\mathbb{R})$;
     $u_0(x)\in [0,1]$ for a.e.~$x\in\mathbb{R}$.}
\end{equation}
The assumption that $f(0)=f(1)=0$ is motivated by considerations
like the following: Consider the initial value problem
$$
\partial_t u -
\partial_x \Big(\frac{\mathop{\rm sign}{(x)}}{1+\abs{u}}\Big) = 0,\quad u(x,0)=0.
$$
The entropy solution to this problem is
$$
u(x,t)=\max\Big\{0,\,
    \sqrt{\abs{t/x}}-1\,\Big\}.
$$
Clearly $u(x,t)$ is unbounded, and the reason for this is that
$f(u)=1/(1+\abs{u})\ne 0$ for any $u$. Furthermore, $u(x,t)$ is
also an entropy solution if we modify $f$ to read
$$
f(u)=\begin{cases}
    0, & u<-1, \\
    -3u^3 - 5u^2 - u +1, & -1\le u < 0,\\
    1/(1+u), & u\ge 0.
\end{cases}
$$
In this case $f$ is continuously differentiable, and $f(-1)=0$,
however $f(u)>0$ for all $u>-1$.
Hence, to bound weak solutions, we
shall need the assumption that there exist numbers $\alpha<\beta$
such that $f(\alpha)=f(\beta)=0$ and that $u_{0}(x)\in
[\alpha,\beta]$ for all $x$.
To make the presentation simple, we normalize such
that $\alpha=0$, $\beta=1$.

As we have just seen, the ``degenerate parabolicity'' condition
\eqref{A_ass} is general enough to include as a special case of
\eqref{eq:prob1} the hyperbolic conservation law with discontinuous
coefficient:
\begin{equation}
   \label{eq:hyp}
   \partial_t  u + \partial_x  \bigl(\gamma(x)f(u)\bigr)= 0.
\end{equation}
This equation is used to model a variety of phenomena, among which are
traffic flow \cite{Whitham} and flow of hydrocarbons in porous media. In
addition, such equations occur when solving Hamilton-Jacobi equations
numerically by dimensional splitting \cite{KR:HJsplitt}.

Independently of the smoothness of $\gamma(\cdot)$, if \eqref{eq:prob1}
is allowed to degenerate at certain points, that is,
$A'(s)=0$ for some values of $s$, solutions are not
necessarily smooth and weak solutions must be sought.
A \textit{weak solution} is defined as follows:

\begin{definition}    \label{weak_def} \rm
   A weak solution of \eqref{eq:prob1} is
   a measurable function $u=u(x,t)$ satisfying:
   \begin{enumerate}
      \item[D1] $u\in L^1(\Pi_T)\bigcap L^{\infty}(\Pi_T)$ and
      $A(u) \in L^2(0,T;H^1(\mathbb{R}))$. \label{def:weak1}

      \item[D2] For all $\varphi\in \mathcal{D}(\mathbb{R}\times [0,T))$,
      \begin{align}
         \label{weak_cond}
         \begin{split}
            \iint_{\Pi_T}\Bigl(u\partial_t \varphi &
            + \bigl[\gamma(x)f(u)
            -\partial_x A(u)\bigr]\partial_x\varphi\Bigr)\, dt\, dx
            + \int_{\mathbb{R}} u_0(x)\phi(x,0)= 0.
         \end{split}
       \end{align}\label{def:weak2}
   \end{enumerate}
\end{definition}

On the other hand, if $A'(s)$ is
zero on an interval $[\alpha,\beta]$, (weak) solutions
may be discontinuous and they are not
uniquely determined by their initial data.
Consequently, an entropy condition must be imposed to
single out the physically correct solution. If $\gamma(\cdot)$ is
sufficiently ``smooth'',
a weak solution $u$ satisfies the \textit{entropy condition} if
for all convex $C^2$ functions $\eta:\mathbb{R}\to\mathbb{R}$,
\begin{align}
   \label{Convex_entropy_cond}
   \begin{split}
     \partial_t \eta(u)
      + \partial_x\bigl(\gamma(x)q(u)\bigr) +\partial_x^2 r(u)
      + \gamma'(x)\bigl(\eta'(u)f(u)-q(u)\bigr)
      \le 0 \,\, \text{in $\mathcal{D}^\prime(\Pi_T)$},
   \end{split}
\end{align}
where $q,r:\mathbb{R}\to \mathbb{R}$ are defined by
$q'(u)=\eta'(u)f'(u)$ and $r'(u)=\eta'(u)A'(u)$.
By standard limiting argument, \eqref{Convex_entropy_cond} implies
that the Kru\v{z}kov-type entropy condition
\begin{align}
   \label{entropy_cond}
   \begin{split}
      \partial_t |u-c| &+
      \partial_x\Bigl(\gamma(x)\mathop{\rm sign}(u-c)\bigl(f(u)-f(c)\bigr)\Bigr) \\
      &+ \partial_x^2\abs{A(u)-A(c)}
      + \gamma'(x)\mathop{\rm sign}(u-c)f(c) \le 0
   \end{split}
\end{align}
holds in $\mathcal{D}^\prime(\Pi_T)$ for all $c\in\mathbb{R}$.
For pure hyperbolic equations, the entropy
condition \eqref{entropy_cond} was introduced
by Kru\v{z}kov \cite{Kruzkov} and Vol'pert \cite{Volpert}.
For degenerate parabolic equations, it must be
attributed to Vol'pert and Hudjaev \cite{VolHud}.
The main reference on the uniqueness and stability of entropy solutions
of degenerate parabolic equations is the recent paper
by Carrillo \cite{Carrillo} (see also Chen and
DiBenedetto \cite{ChenDiBen}), which in turn is a generalization
of Kru\v{z}kov's work on hyperbolic equations.
Following \cite{Carrillo}, it was proved in
\cite{KR:Rough_Unique} that the entropy
solution of \eqref{eq:prob1} (as well
as a more general equation in multi-dimensions) is unique
when $\gamma(\cdot)$ is ``smooth''.
Moreover, in the $L^{\infty}(0,T;BV(\mathbb{R}^d))$ class of entropy solutions, an
$L^1$ contraction principle as well as ``continuous dependence''
estimates were proved.
Recently there seems to be renewed interest
in applying ``hyperbolic'' techniques to degenerate parabolic equations.
For a partial overview of mathematical and numerical theory
for degenerate parabolic equations based on
``hyperbolic'' techniques, see the lecture notes \cite{EspKar}.

In this paper, we are interested in taking a first step towards
developing a well-posedness theory for degenerate parabolic
equations with discontinuous coefficients.  To be a bit more precise,
we aim at proving existence of a weak solution to \eqref{eq:prob1}
when the coefficient $\gamma(x)$ may depend discontinuously on $x$.
We will also prove uniqueness of the constructed weak solution.

Let $u_{\varepsilon}$ be the unique classical solution of
uniformly parabolic problem
\begin{align*}
      &\partial_t u_{\varepsilon}+\partial_x \bigl(\gamma_{\varepsilon}(x)
     f(u_{\varepsilon})\bigr)=
      \partial_x^2 A_{\varepsilon}(u_{\varepsilon}), \quad (x,t)\in \Pi_T, \\
     & u_{\varepsilon}(x,0)={u_0}_{\varepsilon}(x),    \quad x\in\mathbb{R},
\end{align*}
where $\gamma_{\varepsilon}$ is a smooth coefficient, $A_{\varepsilon}'(\cdot)>0$, and
${u_0}_{\varepsilon}$ is a smooth initial function (see Section
\ref{sec:existence} for precise statements).
We prove existence of
a weak solution of \eqref{eq:prob1} by establishing strong convergence
of the sequence $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ of smooth
approximations. Roughly speaking, our
main theorem can be stated as follows:

\begin{theorem*}
    The sequence of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$
    converges strongly in $L^1$ to a weak solution $u$ of
    \eqref{eq:prob1}. Furthermore, a subsequence
    of $\left\{A_{\varepsilon}(u_{\varepsilon})\right\}_{\varepsilon>0}$ converges
    uniformly on compact sets
    to a H\"older continuous function that coincides with $A(u)$ a.e.
\end{theorem*}
Since $\gamma(\cdot)$ may be discontinuous , the total
variation $|u_{\varepsilon}|_{BV}$ cannot be bounded uniformly with respect to
$\varepsilon>0$.  This point will be discussed
below when we put this work in  perspective by reviewing the
available literature on the subject (which exclusively deals with the
hyperbolic case).  The lack of a variation bound prevents an
application of the standard $BV$ compactness argument to
$\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$.  To circumvent this analytical
difficulty, we establish instead strong compactness of the
diffusion function $\{A_{\varepsilon}(u_{\varepsilon})\}_{\varepsilon>0}$ as
well as the ``total flux'' $\{\gamma_{\varepsilon}(x)f(u_{\varepsilon})
- \partial_x A_{\varepsilon}(u_{\varepsilon})\}_{\varepsilon>0}$.  Using the
compactness of these two sequences along with the compensated
compactness method of Murat and Tartar \cite{MuratII,MuratI,Murat:Hneg,TartarI}
to handle the nonlinear transport term, we get strong convergence
along a subsequence of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ to a weak
solution of \eqref{eq:prob1}. The constructed weak solution
is unique thanks to a stability result
in \cite{KR:Rough_Unique}. The detailed proofs are found in
Section~\ref{sec:existence}, while the compensated compactness method is
recalled in Section~\ref{sec:CC}.

When $A'(\cdot)\equiv 0$, the classical Kru\v{z}kov theory applies to the
hyperbolic problem \eqref{eq:hyp} only if the coefficient $\gamma$ is
continuously differentiable.  In the case of a discontinuous
coefficient, the notion of entropy solution \eqref{entropy_cond} as
well as the accompanying existence and uniqueness theory
breaks down.  When $\gamma(\cdot)$ is
discontinuous, the hyperbolic equation \eqref{eq:hyp} has often been
written as a $2\times 2$ system of equations to facilitate the
analysis:
\begin{equation}
   \partial_t \gamma=0, \quad  \partial_t u +\partial_x \bigl(\gamma f(u)\bigr)=0.
     \label{eq:hypsys}
\end{equation}
If $f'(\cdot)$ changes sign, then this system is non-strictly
hyperbolic, a situation described as resonance. An important
consequence of resonance is that no a priori bound on the spatial
variation of the conserved quantity is available, in marked contrast to
the smooth $\gamma$ situation where the Kru\v{z}kov theory applies. For example,
when the initial data is approximated by a sequence of piecewise
constant functions, this can cause the spatial variation to blow
up as the discretization parameter tends to zero \cite{Temple,TveiWi:Hard}.

With no spatial variation bound available for the conserved
quantity, an alternative method of establishing compactness is
required.  To date, all existence results for the case of a
discontinuous coefficient have employed some form of
singular mapping, that is a nonlinear transformation of the conserved quantity.
Indeed, the present work is the first to prove strong
convergence of approximate solutions without appealing to the
singular mapping technique, which was introduced
by Temple \cite{Temple} in order to
establish convergence of the Glimm scheme for a $2 \times 2$
resonant system of conservation laws modeling the displacement of oil in a
reservoir by water and polymer. For the
equation \eqref{eq:hyp}, the singular mapping takes the form
\begin{equation}
    \label{eq:singular-mapping}
    \Psi(u,\gamma) = \gamma \int_0^u |f'(\xi)|\, d\xi,
\end{equation}
from which it is clear that $\Psi$ assigns vanishingly small
weight to variations in
$u$ in the resonant regions (where $f'=0$). This makes it possible
to establish a uniform variation bound for the transformed version
of the conserved quantity, thus establishing compactness for the
approximating sequence in the transformed variable. The singular
mapping $\Psi$ is continuous and strictly monotone as a function of the
conserved quantity, which allows the conserved quantity to be
recovered after passing to the limit in the transformed variable.

In addition to the Glimm scheme, convergence has been established
for the $2 \times 2$ Godunov method by  Lin, Temple, and Wang
\cite{LTW:Comparison,LTW:Suppression}.
Specifically, they applied the $2 \times 2$ Godunov
method to the system
\begin{equation}
   \partial_t \gamma=0, \quad  \partial_t u +\partial_x f(\gamma(x),u)=0,
     \label{eq:hypsys-1}
\end{equation}
and used a version of the singular mapping to establish compactness (see
also Hong \cite{JohnHong:2000} for
an ``improved'' singular mapping).  They also
observed that a uniform variation bound (measured via the singular
mapping) had not been proven for any scalar schemes that apply to
\eqref{eq:hypsys-1}, nor for the $2\times2$ Lax-Friedrichs method.
Such bounds have since been established for the scalar
Engquist-Osher and Godunov schemes \cite{TowersI, TowersII}.
Furthermore, with the present work, we add to that list convergence of the
vanishing viscosity/smoothing method.
However, no bound has yet been established for either the scalar or $2\times
2$ version of the Lax-Friedrichs scheme, and thus convergence is
yet to be proven.  Numerical evidence indicates that the
Lax-Friedrichs scheme is well-behaved on these problems; it is the
theory that is deficient at this point.  Our investigation of the
compensated compactness approach, which represents a departure
from the singular mapping technique, is partially motivated by our
desire to find a method that will provide a proof of convergence
for the Lax-Friedrichs scheme.


The front tracking method, which is based on the
work of Dafermos \cite{Dafermos} and
Holden, Holden, and H{\o}egh-Krohn \cite{HoldenHoegh},
has been applied to a number
of hyperbolic problems with discontinuous coefficients. Gimse and
Risebro \cite{Gimsebro:Cauchy} used the front
tracking method to study the two phase flow equation ($s$ denotes
the saturation of one of the phases)
\begin{equation}
   \partial_t s + \partial_x\bigl(f_0(s)(1-g(x)k(s))\bigr)=0,
     \label{eq:2phase}
\end{equation}
where $f_0$ is the so-called fractional flow function, $g(x)$
models the gravitational pull multiplied by the absolute permeability
of the porous medium, and $k(s)$ is the relative permeability
of the relevant phase. In \eqref{eq:2phase}, the
spatially varying coefficient $g(x)$ may be discontinuous.
Gimse and Risebro proved compactness of the sequence of approximations via a
bound on the spatial variation, measured with respect to the
singular mapping. For the scalar conservation law with a concave flux,
Klingenberg and Risebro \cite{KlingbroI} used the front tracking technique to
establish existence, uniqueness, and asymptotic behavior for the
Cauchy problem \eqref{eq:hypsys}.  In \cite{KlingbroI} also, the
singular mapping was the method used to
establish compactness of the approximating sequence.
Concerning uniqueness and stability with
respect to perturbations of the initial data,
the discontinuity of the flux parameter
complicates the analysis. Specifically, the Kru\v{z}kov entropy
condition \eqref{entropy_cond} no longer makes sense,
thus requiring an alternative approach.
To overcome this difficulty, Klingenberg and
Risebro used a so-called wave entropy condition, which allowed
them to prove uniqueness for the limit of the approximate solutions.
For this same concave flux problem,
Klausen and Risebro \cite{KlausenRisebro} proved continuous dependence on the
coefficient $\gamma$ and on the initial data. The approach in
\cite{KlausenRisebro} was to prove that the solution
constructed via the front tracking
approach is the limit of the solutions that result when the
coefficient $\gamma$ is smoothed. The classical Kru\v{z}kov
$L^1$ stability theory applies when
$\gamma$ is smoothed, and the limit solution inherits this stability.
The front tracking method has also been
applied to the situation where the flux $f$ is neither concave nor convex.
Klingenberg and Risebro \cite{KlingbroII} established existence
and uniqueness for the nonconvex flux
$f(u)=\sin(u)$ for $u \in [-\pi,\pi]$. A version
of the singular mapping was used here also, and uniqueness was
established by passing to the limit in a sequence of solutions
corresponding to a smoothed version of $\gamma$.

Convergence of scalar difference schemes for the
case of a smooth spatially varying
flux has been known for many years. For $\gamma \in
C^2\left(\mathbb{R}^d\right)$, convergence of the Lax-Friedrichs
scheme and the upwind scheme was proved in \cite{Oleinik:Discont}.
Under weaker conditions on $\gamma$, e.g., $\gamma'\in BV$, and
for $f$ convex in $u$, convergence of the one-dimensional Godunov
method for \eqref{eq:hypsys} (not for \eqref{eq:prob1}) was shown
by Isaacson and Temple in \cite{IsaacsonTemple3}, see Karlsen
and Risebro \cite{KR:Rough_Diff} for the
multi-dimensional degenerate parabolic case.
For the case of a discontinuous coefficient, Towers \cite{TowersI} proved
convergence of the scalar Godunov and Engquist-Osher
methods for essentially the same concave problem studied
by Klingenberg and Risebro \cite{KlingbroI}, and using the
same version of the singular mapping as those authors. For
piecewise smooth solutions, uniqueness was establish via an $L^1$
stability proof similar to the classical proof of
Quinn \cite{Quinn} for the constant $\gamma$ conservation law.
For the Engquist-Osher scheme, Towers \cite{TowersII}
extended the convergence proof to the case of a
flux $f$ having any finite number of extrema. The question of uniqueness of
limits of the difference scheme was
not addressed for the nonconvex problem.
We plan to address this question in a later work,
which will also discuss uniqueness
for the more general problem \eqref{eq:prob1}.
Convergence of upwind finite difference approximations
for \eqref{eq:prob1} is proved  in \cite{KRT:FDM_degen}.


The singular mapping approach to
convergence for these scalar difference schemes appears to depend
strongly on the close functional relationship between the
viscosity of the Engquist-Osher flux, the Kru\v{z}kov entropy flux,
and the singular mapping. This is true even for the Godunov
scheme, where the proof depends on the fact that the
Engquist-Osher flux is nearly identical to the Godunov flux when
$f$ is concave. This reinforces our impression that the singular
mapping approach is not readily applicable to the Lax-Friedrichs
scheme, and further motivates our interest in the compensated
compactness approach.

The case where the flux $f$ is nonconvex has received less attention
in the literature than the convex/concave case, presumably due to
additional analytical complexity.  An attractive feature of the
vanishing viscosity/smoothing approach presented herein is that the
absence or presence of inflection points does not enter the
analysis, and so no convexity condition is required for the flux $f$.
The (small) price to pay for this is that we
must assume that there is no interval where $f$ is linear.
Also, sign changes of $\gamma$ are handled without any special
considerations.  Sign changes in $\gamma$ are commonly ruled out
\cite{KlingbroI,KlingbroII,KlausenRisebro,TowersI,TowersII}, again due
to added analytical technicalities.


\section{Compensated Compactness} \label{sec:CC}

In this section we recapitulate the results we shall use
from the compensated compactness
method due to Murat and Tartar \cite{MuratII,MuratI,Murat:Hneg,TartarI}.
For a nice overview of applications of the compensated
compactness method to hyperbolic conservation laws, we refer to
Chen \cite{Chen:LN}.

Let $\mathcal{M}(\mathbb{R}^n)$ denote the space of bounded Radon
measures on $\mathbb{R}^n$ and
$$
C_0(\mathbb{R}^n)=\big\{\Psi\in C(\mathbb{R}^n):
\lim_{|x|\to \infty} \Psi(x)=0\big\}.
$$
If $\mu\in \mathcal{M}(\mathbb{R}^n)$, then
$$
\bigl\langle \mu, \Psi \bigr\rangle= \int_{\mathbb{R}^n} \Psi \,d\mu,
\quad \text{for all}\quad \Psi \in C_0(\mathbb{R}^n).
$$
Recall that $\mu\in \mathcal{M}(\mathbb{R}^n)$ if and only if
$\left|\bigl\langle \mu, \Psi \bigr\rangle\right|
\le C \norm{\Psi}{L^{\infty}(\mathbb{R}^n)}$ for all
$\Psi \in C_{0}(\mathbb{R}^n)$.
We define
$$
\norm{\mu}{\mathcal{M}(\mathbb{R}^n)}=
\sup\left\{\left|\bigl\langle \mu, \Psi \bigr\rangle\right|:
\Psi\in C_0(\mathbb{R}^n), \norm{\Psi}{L^{\infty}(\mathbb{R}^n)}\le 1 \right\}.
$$
The space $\bigl(\mathcal{M}(\mathbb{R}^n),\norm{\cdot}{\mathcal{M}(\mathbb{R}^n)}\bigr)$
is a Banach space
and it is isometrically isomorphic to the dual space of
$\bigl(C_0(\mathbb{R}^n),\norm{\cdot}{L^{\infty}(\mathbb{R}^n)}\bigr)$, while we
define the space of probability measures $\mathrm{Prob}(\mathbb{R}^n)$  as
$$
\mathrm{Prob}(\mathbb{R}^n) = \left\{ \mu\in \mathcal{M}(\mathbb{R}^n): \text{$\mu$
is nonnegative and $\norm{\mu}{\mathcal{M}(\mathbb{R}^n)}=1$}\right\}.
$$
Then we can state the fundamental theorem in the theory of compensated
compactness.
\begin{theorem}\label{thm:Young}
   Let $K\subset \mathbb{R}$ be a bounded open set and $u_{\varepsilon}:\Pi_T\to K$.  Then
   there exists a family of probability
   measures $\{\nu_{(x,t)}(\lambda)\in
   \mathrm{Prob}(\mathbb{R}^n)\}_{(x,t)\in \Pi_T}$ (depending weak-$\star$ measurably on
   $(x,t)$) such that
   $$
   \mathrm{supp}\, \nu_{(x,t)}\subset \overline{K}\,\,\text{for a.e.~$(x,t)\in \Pi_T$}.
   $$
   Furthermore, for any continuous function $\Phi:K\to\mathbb{R}$, we have
   along a subsequence
   $$
   \Phi(u_{\varepsilon}) \overset{\star}\rightharpoonup \overline{\Phi}
   \,\, \text{in $L^{\infty}(\Pi_T)$ as $\varepsilon\downarrow 0$},
   $$
   where (the exceptional set depends possibly on $\Phi$)
   $$
   \overline{\Phi}(x,t):=\left\langle\nu_{(x,t)},\Phi\right\rangle
   =\int_{\mathbb{R}} \Phi(\lambda)\,d\nu_{(x,t)}(\lambda)\,\,
      \text{for a.e.~$(x,t)\in \Pi_T$}.
   $$
\end{theorem}
In the literature, $\nu_{(x,t)}$ is often referred to as a Young measure.
Theorem \ref{thm:Young} provides us with a representation
formula for weak limits in terms of nonlinear
functions and Young measures.
A uniformly bounded sequence $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$
converges to $u$ a.e.~on $\Pi_T$ if and only if
the corresponding Young measure $\nu_{(x,t)}$ reduces
to a Dirac measure located at $u(x,t)$, i.e.,
$\nu_{(x,t)}=\delta_{u(x,t)}$.

We have the following ``reduction'' result:
\begin{lemma}
   \label{reduction}
   Let $K\subset \mathbb{R}$ be a bounded open set and $u_{\varepsilon}:\Pi_T\to K$.
   Suppose that $u_{\varepsilon}\overset{\star}\rightharpoonup u$ in $L^{\infty}(\Pi_T)$.
   Suppose also
   that for any pair of (not necessarily convex) $C^2$ functions
   $\eta_1,\eta_2:\mathbb{R}\to\mathbb{R}$, we have along a subsequence
   \begin{equation}
      \label{red_assump}
      \gamma(x)q_1(u_{\varepsilon})\eta_2(u_{\varepsilon})
      - \eta_1(u_{\varepsilon}) \gamma(x)q_2(u_{\varepsilon})
      \overset{\star}\rightharpoonup
      \gamma(x)\,\overline{q_1}\,\overline{\eta_2}
      - \overline{\eta_1}\, \gamma(x)\,\overline{q_2} \,\,
      \text{in $L^{\infty}(\Pi_T)$ as $\varepsilon\downarrow 0$},
   \end{equation}
   where $q_i:\mathbb{R}\to \mathbb{R}$ is defined by $q_i'(u)=\eta_i'(u)f'(u)$, $i=1,2$.
   Then along a subsequence
   $$
   \gamma(x) f(u_{\varepsilon}) \overset{\star}\rightharpoonup \gamma(x)f(u)\,\,
   \text{in $L^{\infty}(\Pi_T)$  as $\varepsilon\downarrow 0$}.
   $$
   Furthermore, if $\gamma(x)\neq 0$ for a.e.~$x\in\mathbb{R}$
   and there is no interval on which $f(\cdot)$ is linear, then
   a subsequence of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ converges to $u$
   a.e.~on $\Pi_T$.
\end{lemma}
\begin{proof}
Applying Theorem \ref{thm:Young} for the sequence $\left\{u_{\varepsilon}\right\}$ with
$$
\Phi(\lambda)=q_1(\lambda) \eta_2(\lambda)-
\eta_1(\lambda)q_2(\lambda), 
$$
we get that, as $\varepsilon\downarrow 0$,
$$
\gamma(x)q_1(u_{\varepsilon})\eta_2(u_{\varepsilon})
- \eta_1(u_{\varepsilon}) \gamma(x)q_2(u_{\varepsilon})
\overset{\star}\rightharpoonup
\overline{\gamma(x)q_1\eta_2 - \eta_1\gamma(x)q_2}
\,\,
\text{in $L^{\infty}(\Pi_T)$}.
$$
{}From this and assumption \eqref{red_assump}, we get the following
Murat-Tartar commutation relation:
\begin{equation}
   \label{MT:relation}
   \gamma(x) \Bigl[ \overline{q_1}\,\overline{\eta_2}
   - \overline{\eta_1}\,\overline{q_2}
   - \overline{q_1\eta_2 - \eta_1q_2}\Bigr]=0
   \,\,\text{for a.e.~$(x,t)\in\Pi_T$.}
\end{equation}
Following Chen \cite{Chen:LN}, we choose
\begin{alignat*}{2}
   &\eta_1(\lambda)=\lambda - u(x,t), && \quad
   q_1(\lambda)=f(\lambda)-f(u(x,t)),\\
   &\eta_2(\lambda)=q_1(\lambda), && \quad
   q_2(\lambda)=\int_{u(x,t)}^{\lambda} \bigl(f'(\xi)\bigr)^2\, d\xi,
\end{alignat*}
and note that $\overline{\eta_1}\equiv 0$.
Inserting this choice into the
commutation relation \eqref{MT:relation} yields
\begin{multline}
   \label{MT:relation_nyI}
\gamma(x) \Bigl[ \Big(\int_{\mathbb{R}} \bigl(f(\lambda)-f(u(x,t))\bigr)
        \,d\nu_{(x,t)}(\lambda)\Big)^2 \\
      + \int_{\mathbb{R}} \Big( \bigl(\lambda - u(x,t)\bigr)\int_{u(x,t)}^{\lambda}
      \bigl(f'(\xi)\bigr)^2\, d\xi - \bigl(f(\lambda)-f(u(x,t))\bigr)^2
      \Big)\,d\nu_{(x,t)}(\lambda)\Bigr]=0.
\end{multline}
By the Cauchy-Schwartz inequality
$$
\left(f(\lambda)-f(u(x,t))\right)^2 =
\Big(\int_{u(x,t)}^{\lambda} f'(\xi)\, d\xi\Big)^2 \le
\bigl(\lambda-u(x,t)\bigr)
\int_{u(x,t)}^{\lambda} (f'(\xi))^2\, d\xi,
$$
with equality if and only if $f''(\xi)=0$ for all $\xi$ between $u(x,t)$
and $\lambda$. Hence, if $\gamma(x)\ne 0$, both terms in
\eqref{MT:relation_nyI} must be zero. The first term being zero
implies that $\overline{f}(x,t)=f(u(x,t))$.
Hence, by the boundedness of $\gamma$, we can conclude that
$\gamma(x)\overline{f} = \gamma(x)f(u)$ a.e.~on $\Pi_T$.
In view of Theorem \ref{thm:Young}, this proves the first
part of the proposition.

The second part of the theorem
follows by observing that if $\gamma,f''\not= 0$ a.e., then the
fact that the second term in \eqref{MT:relation_nyI}
is zero implies $\nu_{(x,t)}=\delta_{u(x,t)}$ a.e.~on $\Pi_T$ (since $f$ is
assumed to be genuinely nonlinear).
\end{proof}

\begin{remark}\normalfont
   If $\gamma(\cdot)=0$ on a set
   of non-zero measure, then it is not possible to
   conclude that (a subsequence of) $u_{\varepsilon}$ converges strongly
   to $u$ nor that $f(u_{\varepsilon})\overset{\star}\rightharpoonup
   f(u)$ in $L^{\infty}(\Pi_T)$.
   Nevertheless, Proposition \ref{reduction} can be used
   to prove that the $L^{\infty}(\Pi_T)$ weak-$\star$ limit
   $u$ is a weak solution of \eqref{eq:prob1}. Moreover, if this was
   our only goal, then we could have replaced the $C^2$ assumption
   on $f$ by merely $C^1$, or even Lipschitz. To see this,
   we do as Tartar did and insert the functions
   \begin{alignat*}{2}
      &\eta_1(\lambda)=\lambda, && \quad
      q_1(\lambda)=f(\lambda),\\
      &\eta_2(\lambda)=\abs{\lambda-u(x,t)}, && \quad
      q_2(\lambda)=\mathop{\rm sign}(\lambda-u(x,t))\bigl(f(\lambda)-f(u(x,t))\bigr)
  \end{alignat*}
  into the Murat-Tartar commutation relation \eqref{MT:relation}.
  Of course, now we suppose that
  \eqref{red_assump} holds for $\eta_1(\lambda)=\lambda$ and any
  convex (Lipschitz continuous) function $\eta_2:\mathbb{R}\to\mathbb{R}$.
  The result is
  \begin{multline*}
  \gamma(x)\Bigl[ \overline{f}\int_{\mathbb{R}} 
  \abs{\lambda-u(x,t)}\,d\nu_{(x,t)}(\lambda)
  - u\int_{\mathbb{R}} \mathop{\rm sign}(\lambda-u(x,t))
   \bigl(f(\lambda)-f(u(x,t))\bigr)
       \,d\nu_{(x,t)}(\lambda)
     \\
    - \int_{\mathbb{R}} \Bigl(f(\lambda)\abs{\lambda-u(x,t)}
     - \lambda\, \mathop{\rm sign}(\lambda-u(x,t))\bigl(f(\lambda)-f(u(x,t))\bigr)
     \Bigr)\,d\nu_{(x,t)}(\lambda)\Bigr]=0,
  \end{multline*}
  which can be rewritten as
  \begin{multline}
     \label{red_tmp_Tartar}
     \gamma(x) \int_{\mathbb{R}} \biggl(
        \bigl[\, \overline{f}(x,t)-f(\lambda)\bigr]\abs{\lambda-u(x,t)}
        \\
        +\bigl[\lambda - u(x,t)\bigr]
        \mathop{\rm sign}(\lambda-u(x,t))\bigl(f(\lambda)-f(u(x,t))\bigr)
        \biggr)\,d\nu_{(x,t)}(\lambda)=0,
  \end{multline}
  or
  $$
  \gamma(x)
  \bigl[f(u(x,t))-\overline{f}(x,t)\bigr]
  \int_{\mathbb{R}} \abs{\lambda-u(x,t)}\,d\nu_{(x,t)}(\lambda)=0.
  $$
  Consequently, we have
  either $\gamma(x)\overline{f}(x,t)=\gamma(x)f(u(x,t))$ or, if $\gamma(x)\ne 0$,
  $\overline{f}=f(u(x,t))$ or $\nu_{(x,t)}=\delta_{u(x,t)}$,
  which also implies $\gamma(x)\overline{f}(x,t)=\gamma(x)f(u(x,t))$.
  This proves our claim.
\end{remark}

Before we continue, we need to recall the celebrated Div-Curl lemma.

\begin{lemma}[Div-Curl]\label{lem:divcurl}
   Let $Q\subset \mathbb{R}^2$ be a bounded domain.
   Suppose
   \begin{align*}
      &v_{\varepsilon}^1 \rightharpoonup \overline{v}^1,
      \quad v_{\varepsilon}^2\rightharpoonup\overline{v}^2,  \\
      &w_{\varepsilon}^1 \rightharpoonup \overline{w}^1,
      \quad w_{\varepsilon}^2\rightharpoonup\overline{w}^2,
   \end{align*}
   in $L^2(Q)$ as $\varepsilon\downarrow 0$. Suppose also that the two
   sequences
   $\left\{\mathop{\rm div}\left(v_{\varepsilon}^1,
   v_{\varepsilon}^2\right)\right\}_{\varepsilon>0}$
   and
   $ \left\{ \mathop{\rm curl}\left(w_{\varepsilon}^1,
   w_{\varepsilon}^2\right)\right\}_{\varepsilon>0}$
   lie in a (common) compact subset of $H_{\mathrm{loc}}^{-1}(Q)$,
   where \\
   $\mathop{\rm div}\left(v_{\varepsilon}^1,v_{\varepsilon}^2\right)
   =\partial_{x_1}v_{\varepsilon}^1+\partial_{x_2}v_{\varepsilon}^2$
   and $\mathop{\rm curl}\left(w_{\varepsilon}^1,w_{\varepsilon}^2\right)
     =\partial_{x_1}w_{\varepsilon}^2-\partial_{x_2}w_{\varepsilon}^1$.
   Then along a subsequence
   $$
   \left(v_{\varepsilon}^1,v_{\varepsilon}^2\right)\cdot \left(w_{\varepsilon}^1,
   w_{\varepsilon}^2\right)
   \to \left(\overline{v}^1,\overline{v}^2\right)\cdot
   \left(\overline{w}^1,\overline{w}^2\right)\quad
   \text{in $\mathcal{D}^\prime(Q)$ as $\varepsilon\downarrow 0$.}
   $$
\end{lemma}

\begin{theorem}\label{Tartar}
   Suppose that $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}\subset L^{\infty}(\Pi_T)$
   uniformly in $\varepsilon$. Suppose also that for any $C^2$
   function $\eta:\mathbb{R}\to\mathbb{R}$, the sequence of distributions
   \begin{equation}
      \label{assumption:Hneg}
      \left\{\partial_t \eta(u_{\varepsilon}) +
      \partial_x \bigl(\gamma(x)q(u_{\varepsilon})\bigr)\right\}_{\varepsilon>0} \,\,
      \text{lies in a compact subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$},
   \end{equation}
   where $q:\mathbb{R}\to\mathbb{R}$ is defined by $q'(u)=\eta'(u)f'(u)$.  Then along a
   subsequence
   \begin{equation}
      \label{eq:limit}
      u_{\varepsilon}\overset{\star}\rightharpoonup u \,\,\text{in $L^{\infty}(\Pi_T)$
      as $\varepsilon\downarrow 0$},
      \quad \gamma(x)f(u_{\varepsilon}) \overset{\star}\rightharpoonup \gamma(x)f(u)\,\,
      \text{in $L^{\infty}(\Pi_T)$ as $\varepsilon\downarrow 0$}.
   \end{equation}
   Furthermore, if $\gamma(x)\neq 0$ for a.e.~$x\in\mathbb{R}$
   and there is no interval on which $f(\cdot)$ is linear, then
   a subsequence of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ converges to $u$
   a.e.~on $\Pi_T$.
\end{theorem}
\begin{proof}
Let $\eta_1,\eta_2:\mathbb{R}\to\mathbb{R}$ be a pair of $C^2$ functions
and define $q_i$ by $q_i'(u)=\eta_i'(u)f'(u)$, $i=1,2$.
Consider then the vector fields
$$
v_{\varepsilon}=\left(\eta_1(u_{\varepsilon}),\gamma(x)q_1(u_{\varepsilon})\right),\quad
w_{\varepsilon}=\left(-\gamma(x)q_2(u_{\varepsilon}),\eta_2(u_{\varepsilon})\right).
$$

In view of Theorem~\ref{thm:Young}, the $L^{\infty}$ bounds on $u_{\varepsilon}$
and $\gamma(x)$ imply that along subsequences
$$
v_{\varepsilon} \overset{\star}\rightharpoonup \overline{v}
:= \left(\overline{\eta_1},\gamma(x)\overline{q_1}\right)
\,\,\text{in $L^{\infty}(\Pi_T)$},\quad
w_{\varepsilon} \overset{\star}\rightharpoonup \overline{w}:= \left(-\gamma(x)\overline{q_2},
\overline{\eta_2}\right)
\,\,\text{in $L^{\infty}(\Pi_T)$}.
$$
By assumption \eqref{assumption:Hneg}, the sequences
\begin{align*}
   &\left\{\mathop{\rm div} \left(v_{\varepsilon}\right)\right\}_{\varepsilon>0}=
   \left\{\bigl(\partial_t \eta_1(u_{\varepsilon})
     + \partial_x \bigl(\gamma(x)q_1(u_{\varepsilon})\bigr)\right\}_{\varepsilon>0},\quad
   \\ & \left\{\mathop{\rm curl}\left(w_{\varepsilon}\right)\right\}_{\varepsilon>0} =
   \left\{\partial_t \eta_2(u_{\varepsilon})
   + \partial_x \bigl(\gamma(x)q_2(u_{\varepsilon})\bigr)\right\}_{\varepsilon>0}
\end{align*}
lie in a (common) compact subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$.
Also, we have $\left\{v_{\varepsilon}\right\}_{\varepsilon>0},
\left\{w_{\varepsilon}\right\}_{\varepsilon>0}
\subset L^{\infty}(\Pi_T)$ and therefore
$\left\{v_{\varepsilon}\right\}_{\varepsilon>0},
\left\{w_{\varepsilon}\right\}_{\varepsilon>0}\subset L^2_{\mathrm{loc}}(\Pi_T)$ uniformly
in $\varepsilon$. The Div-Curl lemma then gives (up to the
extraction of a subsequence)
$$
v_{\varepsilon}\cdot w_{\varepsilon} \to \overline{v}\cdot \overline{w}\quad
\text{in }\mathcal{D}^\prime(\Pi_T).
$$
Since we work with bounded functions, we have that
$\left\{v_{\varepsilon}\cdot w_{\varepsilon}\right\}_{\varepsilon>0}$
converges weakly-$\star$ in $L^{\infty}(\Pi_T)$ along
a subsequence to (necessarily) $\overline{v}\cdot \overline{w}$. Therefore
along a subsequence
$$
\gamma(x)q_1(u_{\varepsilon})\eta_2(u_{\varepsilon}) - \eta_1(u_{\varepsilon})
\gamma(x)q_2(u_{\varepsilon})
\overset{\star}\rightharpoonup  \gamma(x)\, \overline{q_1}\,\overline{\eta_2}
- \overline{\eta_1}\,\gamma(x)\,\overline{q_2}
\,\,\text{in $L^{\infty}(\Pi_T)$}.
$$
In view of Lemma \ref{reduction}, this concludes the proof.
\end{proof}

The following compactness interpolation result (known
as Murat's lemma \cite{Murat:Hneg}) is useful
in obtaining the $H_{\mathrm{loc}}^{-1}$ compactness needed in
Theorem \ref{Tartar}.
\begin{lemma}\label{Murat}
   Suppose that $\left\{\mathcal{L}_{\varepsilon}\right\}_{\varepsilon>0}$ is
   bounded in $W^{-1,\infty}(\Pi_T)$.
   Suppose also that $\mathcal{L}_{\varepsilon}=\mathcal{L}_{\varepsilon}^1
  + \mathcal{L}_{\varepsilon}^2$, where
   $\left\{\mathcal{L}_{\varepsilon}^1\right\}_{\varepsilon>0}$ lies in a compact
   subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$ and
   $\left\{\mathcal{L}_{\varepsilon}^2\right\}_{\varepsilon>0}$ lies in a
   bounded subset of $\mathcal{M}_{\mathrm{loc}}(\Pi_T)$. Then
   $\left\{\mathcal{L}_{\varepsilon}\right\}_{\varepsilon>0}$ lies in a compact
   subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$.
\end{lemma}


\section{Existence of Weak Solution} \label{sec:existence}

Existence of a weak solution will be proved by establishing convergence of
a suitable sequence of smooth functions solving regularized problems.
Let $\omega_{\varepsilon} \in C_0^{\infty}(\mathbb{R})$ be a nonnegative
function satisfying
$$
\omega(x)=\omega(-x), \quad
\omega(x)\equiv 0\quad
\text{for $|z|\geq 1$}, \quad
\int_{\mathbb{R}}\omega(z)\,dz=1.
$$
For $\varepsilon>0$, let $\omega_{\varepsilon}(x)=
\frac{1}{\varepsilon}\omega\left(\frac{x}{\varepsilon}\right)$ and
introduce the ``smoothed'' coefficient
$$
\gamma_{\varepsilon}=\omega_{\varepsilon}\star\gamma.
$$
Define the ``approximate'' initial function
$$
{u_0}_\varepsilon=\omega_{\varepsilon}\star u_0.
$$
Observe that ${u_0}_\varepsilon\in C^\infty(\mathbb{R})$ and
$$
{u_0}_\varepsilon\to u_0 \quad \text{a.e.~in $\mathbb{R}$ and in $L^p(\mathbb{R})$
for any $p\in [1,\infty)$ as $\varepsilon\downarrow 0$}.
$$
We then let $u_{\varepsilon}$ be the solution of
the uniformly parabolic problem
\begin{equation}
   \label{approx_problem}
   \begin{aligned}
      &\partial_t u_{\varepsilon}+\partial_x \bigl(\gamma_{\varepsilon}(x)
      f(u_{\varepsilon})\bigr)=
      \partial_x^2 A_{\varepsilon}(u_{\varepsilon}), \quad
      (x,t)\in \Pi_T, \\
      &u_{\varepsilon}(x,0)={u_0}_\varepsilon(x), \quad x\in \mathbb{R},
   \end{aligned}
\end{equation}
where $A_{\varepsilon}(u)=A(u) +\varepsilon u$.
According to \cite{LSU:67} there exists
a unique bounded classical ($C^{2,1}$)
solution $u_\varepsilon$ to \eqref{approx_problem}.
In what follows, we suppose that $u_\varepsilon$
vanishes sufficiently fast as $|x|\to \infty$.

Our goal is to
pass to the limit in $u_{\varepsilon}$ as $\varepsilon\downarrow 0$.
As was already mentioned in the introduction, our main problem
is the lack of a $BV$ estimate on $u_{\varepsilon}$ (which is
uniform in $\varepsilon$) and hence strong convergence
of $\{u_{\varepsilon}\}_{\varepsilon>0}$.  Instead, we
shall derive a series of a priori
estimates which will imply strong compactness of
$\{A(u_{\varepsilon})\}_{\varepsilon>0}$. This strong compactness
together with some a priori estimates on the ``total flux'' 
$$
\gamma_{\varepsilon}(x) f(u_{\varepsilon}) -
\partial_x A_{\varepsilon}(u_{\varepsilon})
$$ 
will make it possible for us to use the compensated
compactness method to obtain the
desired strong convergence. Finally, we will
prove (this is the easy part) that any
limit point of a convergent subsequence
of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ is a weak solution
of \eqref{eq:prob1}. Uniqueness of the constructed weak solution
is a direct consequence of a stability result
in \cite{KR:Rough_Unique}.
Before continuing, we mention that
the compensated compactness method has been
applied before to certain degenerate parabolic equations (with
smooth coefficients) by Zhao \cite{Zhao:CC} and Yin \cite{Yin:CC}.

Our first lemma gives uniform $L^1$ and $L^{\infty}$ estimates
on $u_{\varepsilon}$ (the proof of the latter
exploits assumption \eqref{f_ass}).

\begin{lemma}
   \label{lem:max}
   There exists a constant $C>0$, independent of $\varepsilon$, such that
   $$
   \norm{u_{\varepsilon}(\cdot,t)}{L^1(\mathbb{R})},\,\norm{u_{\varepsilon}
   (\cdot,t)}{L^{\infty}(\mathbb{R})}\le C,
   \quad \text{for all}\quad t\in (0,T).
   $$
\end{lemma}

\begin{proof}
{}From the $L^1$ contraction property proved in, e.g., \cite{KR:Rough_Unique}
it follows that
$$
\norm{u_{\varepsilon}(\cdot,t)}{L^1(\mathbb{R})}\le
\norm{u_{\varepsilon}(\cdot,0)}{L^1(\mathbb{R})},\quad
\text{for all}\quad t\in(0,T).
$$
Regarding the $L^{\infty}$ estimate, we will prove that if
$u_{0}(x)\in[0,1]$ for all $x$ then
$u_{\varepsilon}(x,t)\in [0,1]$ for all $(x,t)$. Our proof
is inspired by \cite{HRT-Max:95}.
For $\delta>0$, let $v$ solve the
auxiliary initial value problem
\begin{equation}
   \partial_t v+\partial_x\bigl(\gamma_{\varepsilon}(x)f(v)\bigr)
   =\partial_x^2 A_{\varepsilon}(v) +
   \delta h(v),\quad v(x,0)={u_0}_{\varepsilon}(x),
   \label{eq:vauxil}
\end{equation}
where the source $h(v):=1-2v$ satisfies
$h(0)=1>0$, $h(1)=-1<0$, and $h'=-2<0$.

{}From \cite{LSU:67} we know that there exists
a unique bounded classical ($C^{2,1}$)
solution $v$ to \eqref{eq:vauxil}.
Note that $v(x,0)\in [0,1]$ for all $x\in \mathbb{R}$.
Now suppose that there exists a compact set
$K\subset \Pi_{T}$ such that
$$
v(x,t)>1, \quad \forall (x,t)\in K.
$$
If $K$ is nonempty, set
$$
\bar{t}=\inf\left\{t: \exists \bar{x}, v(\bar{x},t)=1\right\}.
$$
Clearly, $\bar{t}>0$.
By compactness of $K$ and the smoothness of $v$ there
must be a point $\bar{x}$ such that $v(\cdot,\bar{t})$ has a local maximum
at $\bar{x}$ and $v(\bar{x},\bar{t})=1$. Furthermore,
$$
\partial_x v\left(\bar{x},\bar{t}\right)=0,\quad
\partial_x^2 v \left(\bar{x},\bar{t}\right)\le 0,\quad\text{and}\quad
\partial_t v\left(\bar{x},\bar{t}\right) \ge 0.
$$
Using \eqref{eq:vauxil} at $\left(\bar{x},\bar{t}\right)$,
$f\left(v\left(\bar{x},\bar{t}\right)\right)=f(1)=0$, and
$h\left(v\left(\bar{x},\bar{t}\right)\right)=h(1)=-1$, we find that
\begin{multline*}
   0 \le \partial_t v\left(\bar{x},\bar{t}\right) +
   \partial_x \gamma_{\varepsilon}(\bar{x})f\left(v\left(\bar{x},\bar{t}\right)\right) +
   \gamma_{\varepsilon}(\bar{x}) f'\left(v\left(\bar{x},\bar{t}\right)\right)
   \partial_x v\left(\bar{x},\bar{t}\right)\\
   =A_{\varepsilon}''\left(v\left(\bar{x},\bar{t}\right)\right)
   \left(\partial_x
      v\left(\bar{x},\bar{t}\right)\right)^2
   + A_{\varepsilon}'
   \left(v\left(\bar{x},\bar{t}\right)\right) \partial_x^2 v\left(\bar{x},\bar{t}\right)
   + \delta h\left(v\left(\bar{x},\bar{t}\right)\right)
   \le -\delta<0.
\end{multline*}
This contradiction implies $K=\emptyset$, and $v\le 1$ in
$\Pi_{T}$. Similarly one shows that $v\ge 0$ in $\Pi_{T}$.

Introduce the weight function
$$
W_\lambda(x)= \exp\big(-\lambda \sqrt{1+\abs{x}^2}\big), \quad
\lambda>0.
$$
It is not hard to modify the proof
of the continuous dependence estimate
in \cite{KR:Rough_Unique} so as to obtain, for
some constant $C>0$ depending on $\lambda$ (and possibly $\varepsilon$)
but not $\delta$,
$$
\iint_{\Pi_{T}} \left|u_\varepsilon(x,t) - v(x,t)\right|W_\lambda(x)\,dt\,dx
\le C\, T\, \delta,
$$
where $u_\varepsilon$ is the bounded $C^{2,1}$ function that solves
\eqref{approx_problem} and $v$ is the $C^{2,1}$ function that solves
\eqref{eq:vauxil}. Thus we have $v\to u_\varepsilon$
pointwise as $\delta \downarrow 0$, and $0\le v\le 1$ in $\Pi_{T}$
implies $0\le u_\varepsilon \le 1$ in $\Pi_{T}$.
\end{proof}

Our next lemma provides us with a uniform $L^2(\Pi_T)$ space and time translation
estimate on $A(u_{\varepsilon})$, and hence strong $L^2_{\mathrm{loc}}$ compactness
of $\{A(u_{\varepsilon})\}_{\varepsilon>0}$. Later we will use this lemma
to pass to the limit in the nonlinear diffusion term.

\begin{lemma}\label{lem:L2_comp_A}
   There exists a constant $C>0$ which
   depends on $T$ but not $\varepsilon$ such that
   \begin{equation}
      \label{eq:weak_spacetime}
      \bigl\|A(u_{\varepsilon}(\cdot+y,\cdot+\tau))-A(u_{\varepsilon}(\cdot,\cdot))
      \bigr\|_{L^2(\Pi_{T-\tau})}
      \le C \,\bigl(|y|+\sqrt{\tau}\bigr),
      \quad \text{$\forall y\in\mathbb{R}$ and $\forall \tau\ge 0$}.
   \end{equation}
   In particular, we have that $\left\{A(u_{\varepsilon})\right\}_{\varepsilon>0}$
   is strongly compact in $L^2_{\mathrm{loc}}(\Pi_T)$.
\end{lemma}

\begin{proof}
Multiply $\partial_t u_{\varepsilon}+\partial_x \bigl(\gamma_{\varepsilon}(x)
f(u_{\varepsilon})\bigr)=
\partial_x \bigl(A_{\varepsilon}'(u_{\varepsilon})\partial_x u_{\varepsilon}\bigr)$
by $u_{\varepsilon}$ and
then do integration by parts in $x$ to obtain
$$
\iint_{\Pi_T}\Bigl(\frac12 \partial_t
(u_{\varepsilon})^2 - \gamma_{\varepsilon}(x) f(u_{\varepsilon})\partial_x u_{\varepsilon}
+ A_{\varepsilon}'(u_{\varepsilon})(\partial_x u_{\varepsilon})^2\Bigr)\, dt\, dx=0.
$$
{}From this equality it follows that
\begin{multline*}
   \iint_{\Pi_T} A_{\varepsilon}'(u_{\varepsilon})
   (\partial_x u_{\varepsilon})^2\, dt\, dx \\
   = \frac12 \norm{u_{\varepsilon}(\cdot,0)}{L^2(\mathbb{R})}^2 -
   \frac12 \norm{u_{\varepsilon}(\cdot,t)}{L^2(\mathbb{R})}^2
   + \iint_{\Pi_T} \gamma_{\varepsilon}(x)
   \partial_x \mathcal{F}(u_{\varepsilon})\, dt\, dx,
\end{multline*}
where $\mathcal{F}(u_{\varepsilon}) = \int_0^{u_{\varepsilon}} f(\xi)\, d\xi$.
Integration by parts gives
$$
\Big|\iint_{\Pi_T} \gamma_{\varepsilon}(x) \partial_x \mathcal{F}(u_{\varepsilon})
\, dt\, dx\Big|
=\Big|\iint_{\Pi_T} \partial_x\gamma_{\varepsilon}(x)
\mathcal{F}(u_{\varepsilon}) \, dt\, dx \Big|
\le C \, T\, |\gamma|_{BV(\mathbb{R})},
$$
so that we end up with
$$
\iint_{\Pi_T} A_{\varepsilon}'(u_{\varepsilon})
(\partial_x u_{\varepsilon})^2\, dt\, dx
\le \frac12 \norm{u_{\varepsilon}(\cdot,0)}{L^2(\mathbb{R})}^2
+ C \, T\, |\gamma|_{BV(\mathbb{R})} \le C,
$$
where the constant does not depend $\varepsilon$.  From this and Lemma
\ref{lem:max}, we conclude that
\begin{equation}
    \iint_{\Pi_T}\bigl(\partial_x A(u_{\varepsilon})\bigr)^2\, dt\, dx
    \le \max_u A'(u)\iint_{\Pi_T} A'(u_{\varepsilon})
    (\partial_x u_{\varepsilon})^2\, dt\, dx \le C,
    \label{eq:NR}
\end{equation}
where the constant $C$ does not depend on $\varepsilon$. From this it
immediately follows that \eqref{eq:weak_spacetime} holds when
$\tau=0$.  To show that \eqref{eq:weak_spacetime} holds when $y=0$ we
calculate as follows
\begin{align*}
   &\iint_{\Pi_{T-\tau}} \Bigl(A(u_{\varepsilon}(x,t+\tau))
   -A(u_{\varepsilon}(x,t))\Bigr)^2\, dt\, dx
   \\ & \quad
   \le \|A\|_{\mathrm{Lip}} \iint_{\Pi_{T-\tau}} \left(\int_t^{t+\tau}
   \partial_t u_{\varepsilon}
     (x,\xi)\,d\xi\right)
   \left(A(u_{\varepsilon}(x,t+\tau))-A(u_{\varepsilon}(x,t))\right)\, dt\, dx
   \\ & \quad
   \le \|A\|_{\mathrm{Lip}} \iint_{\Pi_{T-\tau}} \left(\int_t^{t+\tau}
     \Bigl(-\partial_x \bigl(\gamma_{\varepsilon}(x,\xi) f(u_{\varepsilon}(x,\xi))\bigr)
     +\partial_x^2 A_{\varepsilon}(u_{\varepsilon}(x,\xi))\Bigr)\,d\xi\right)
   \\ & \quad\quad\quad\quad\quad\quad\quad\quad \times
   \Bigl(A(u_{\varepsilon}(x,t+\tau))-A(u_{\varepsilon}(x,t))\Bigr)\, dt\, dx
   \\ & \quad
   =\|A\|_{\mathrm{Lip}} \int_0^{\tau}\biggl\{\iint_{\Pi_{T-\tau}}
   \Bigl(-\partial_x \bigl(\gamma_{\varepsilon}(x,t+s) f(u_{\varepsilon}(x,t+s))\bigr)
   +\partial_x^2 A_{\varepsilon}(u_{\varepsilon}(x,t+s))\Bigr)
   \\ & \quad\quad\quad\quad\quad\quad\quad\quad \times
   \Bigl(A(u_{\varepsilon}(x,t+\tau))-A(u_{\varepsilon}(x,t))\Bigr)\, dt\, dx\biggr\}\,ds
   \\ & \quad
   \le \|A\|_{\mathrm{Lip}} \int_0^{\tau}\biggl\{\iint_{\Pi_{T-\tau}}
   \gamma_{\varepsilon}(x,t+s) f(u_{\varepsilon}(x,t+s))
   \\ & \quad\quad\quad\quad\quad\quad\quad\quad \times
   \Bigl(\partial_x A(u_{\varepsilon}(x,t+\tau))- \partial_x A(u_{\varepsilon}(x,t))
   \Bigr)\, dt\, dx
   \\ & \quad\quad
   + \iint_{\Pi_{T-\tau}} -\partial_x A_{\varepsilon}(u_{\varepsilon}(x,t+s))
   \Bigl(\partial_x A(u_{\varepsilon}(x,t+\tau))- \partial_x A(u_{\varepsilon}(x,t))
   \Bigr)\, dt\, dx\biggr\}\,ds
   \\ & \quad
   \le 2\|A\|_{\mathrm{Lip}} \tau \biggl\{\norm{\gamma_{\varepsilon}
   f(u_{\varepsilon})}{L^2(\Pi_T)}
   \norm{\partial_x A(u_{\varepsilon})}{L^2(\Pi_T)}
   \\ & \quad\quad\quad\quad\quad\quad\quad\quad
   +  \norm{\partial_x A_{\varepsilon}(u_{\varepsilon})}{L^2(\Pi_T)}
    \norm{\partial_x A(u_{\varepsilon})}{L^2(\Pi_T)}\biggr\}
   \le C\, \tau,
\end{align*}
where we have used the equation for $u_{\varepsilon}$ and H\"older's inequality.

Equipped with the uniform space and time translation estimate
\eqref{eq:weak_spacetime}, it is an easy exercise to use Kolmogorov's
compactness criterion to conclude the proof of the lemma.
\end{proof}
{}From Lemma \ref{lem:max} we know that
$M:=\norm{u_{\varepsilon}}{L^{\infty}(\Pi_T)}\le 1$ (uniformly in $\varepsilon$).
Let
$$
K=\max_{\lambda\in [0,1]}|A(\lambda)|=A(1).
$$
For any function $\Phi\in C\left(\left[0,K\right]\right)$,
we then have
$$
\norm{\Phi\left(A(u_{\varepsilon})\right)}{L^{\infty}(\Pi_T)}\le C,
$$
so that along a subsequence
\begin{equation}
    \label{weakstar_Phi_tmp}
    \Phi\left(A(u_{\varepsilon})\right) \overset{\star}\rightharpoonup
    \overline{\Phi} \ \,\, \text{in $L^{\infty}(\Pi_T)$},
\end{equation}
and, from Theorem \ref{thm:Young},
\begin{equation}
    \label{weakstar_Phi}
    \overline{\Phi}(x,t) = \int_{\mathbb{R}} \Phi\left(A(\lambda)\right) \,d\nu_{(x,t)}(\lambda),
    \quad \forall (x,t)\in \Pi_T\setminus N_{\Phi},
\end{equation}
for some exceptional set $N_{\Phi}$ that
depends possibly on $\Phi$ and $\abs{N_{\Phi}}=0$.  One can choose a sequence
$\{\Phi_j\}_{j=1}^{\infty}\subset C\left(\left[0,K\right]\right)$
(e.g., the polynomials with rational coefficients) that is dense in
$C\left(\left[0,K\right]\right)$ and set
\begin{equation}
   \label{Nset}
   N=\bigcup_{j=1}^{\infty} N_{\Phi_j}.
\end{equation}
Then $\abs{N}=0$ and
\begin{equation}
  \label{weakstar_Phi_ny}
  \text{\eqref{weakstar_Phi} holds
  at any point $(x,t)\in \Pi_T\setminus N$
  for each $\Phi\in C\left(\left[0,K\right]\right)$}.
\end{equation}
{}From Lemmas \ref{lem:max} and \ref{lem:L2_comp_A}, we know that
$A(u_{\varepsilon})$ converges along a subsequence to some 
function $\overline{A}$ a.e.~on
$\Pi_T$.  In view of \eqref{weakstar_Phi_ny}, we may assume without loss
of generality that
\begin{equation}
   \label{barA}
   \Psi\left(\overline{A}(x,t)\right)=
   \lim_{\varepsilon\downarrow 0} \Psi\left(A(u_{\varepsilon}(x,t)\right)) =
   \int_{\mathbb{R}} \Psi\left(A(\lambda)\right) \,d\nu_{(x,t)}(\lambda)\,\,
   \text{for all $(x,t)\in \Pi_T\setminus N$},
\end{equation}
for any $\Phi\in C\left(\left[0,K\right]\right)$.
Since $A(u_{\varepsilon}(x,t))\in \left[0,K\right]$ for all $\varepsilon>0$,
we have from \eqref{barA} (with $\Psi(\xi)=\xi$) that
$$
\overline{A}(x,t)\in \left[0,K\right]\,\,
\text{for all $(x,t)\in \Pi_T\setminus N$}.
$$
Let $u$ denote the $L^{\infty}(\Pi_T)$ weak-$\star$ limit of
$\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$.  We can assume without loss of
generality that
\begin{equation}
   \label{baru}
   u(x,t) = \int_{\mathbb{R}} \lambda \,d\nu_{(x,t)}(\lambda)\,\,
   \text{for all $(x,t)\in \Pi_T\setminus N$.}
\end{equation}
For $\xi\in [0,K]$, define the functions
\begin{equation}
   \label{lLdef}
   l(\xi)=\min\Bigl\{\lambda\in [0,1]: A(\lambda)=\xi\Bigr\},\quad
   L(\xi)=\max\Bigl\{\lambda\in [0,1]: A(\lambda)=\xi\Bigr\}.
\end{equation}
In the special case where $A(\cdot)$ is strictly increasing
(so that the inverse function
$A^{-1}(\cdot)$ exists), $l(\xi)=L(\xi)=A^{-1}(\xi)$
for all $\xi$. The function $l(\xi)$ is left-continuous and hence
lower semicontinuous, while the function $L(\cdot)$
is right-continuous and hence upper semicontinuous.
Furthermore,
\begin{align*}
   &l(A(\lambda))\le \lambda \le L(A(\lambda))
   \,\, \text{for all $\lambda\in [0,1]$},
   \\ & l(A(\lambda))=\lambda=L(A(\lambda))
   \,\, \text{for a.e.~$\lambda\in [0,1]$}.
\end{align*}
Observe that
\begin{equation}
   \label{lL_tmp}
   l\left(\overline{A}(x,t))\right)\le
   L\left(\overline{A}(x,t)\right)\,\,
   \text{for all $(x,t)\in \Pi_T\setminus N$}.
\end{equation}
For any $(x,t)\in \Pi_T\setminus N$, introduce
$$
I(x,t):=
\left[l\left(\overline{A}(x,t)\right),L\left(\overline{A}(x,t)\right)\right]
$$
and, in view of \eqref{lL_tmp}, observe that $I(x,t)$ is a single
point or a closed interval.  We shall also need the (measurable) sets
\begin{equation}
   \label{hyp_par_sets}
   \begin{aligned}
     H&:=\Bigl\{(x,t)\in \Pi_T\setminus N:
     l\left(A(u(x,t))\right)<L\left(A(u(x,t))\right)\Bigr\},
     \\
     P&:=\Bigl\{(x,t)\in \Pi_T\setminus N:
     l\left(A(u(x,t))\right)=L\left(A(u(x,t))\right)\Bigr\}.
   \end{aligned}
\end{equation}
We now have the following lemma:

\begin{lemma}
  \label{lem:Alimit_ident}
  We have
  \begin{itemize}
     \item[({\bf i})]  $\mathrm{supp}\, \nu_{(x,t)} \subseteq I(x,t)$ for
     all $(x,t)\in \Pi_T\setminus N$,
     \label{concl:a}

     \item[({\bf ii})] $\nu_{(x,t)}=\delta_{u(x,t)}$ for all $(x,t)\in P$, and
     \label{concl:b}

     \item[({\bf iii})] $\overline{A}(x,t)=A(u(x,t))$ for all $(x,t)\in \Pi_T\setminus N$.
     \label{concl:c}
  \end{itemize}
\end{lemma}
\begin{proof}
Suppose that there exists a point $(x_0,t_0)\in \Pi_T\setminus N$
such
$$
\mathrm{supp}\, \nu_{(x_0,t_0)} \not\subset I(x_0,t_0),
$$
which implies that
$$
\nu_{(x_0,t_0)}\Bigl([0,1] \setminus I(x_0,t_0) \Bigr)>0.
$$
Observing that
$$
A(\lambda)\neq \overline{A}(x_{0},t_{0}), \quad \forall \lambda\in
[0,1] \setminus I(x_0,t_0),
$$
we get, from \eqref{weakstar_Phi} (with $\Psi(\xi)=\abs{\xi-\overline{A}(x_0,t_0)}$)
\begin{align*}
   0 &\equiv \abs{\overline{A}(x_0,t_0) - \overline{A}(x_0,t_0)}
   =\int_{\mathbb{R}} \abs{A(\lambda) - \overline{A}(x_0,t_0)} \,d\nu_{(x_0,t_0)}(\lambda)
   \\ & \ge  \int_{[0,1] \setminus I(x_0,t_0)}
   \abs{A(\lambda) - \overline{A}(x_0,t_0)} \,d\nu_{(x_0,t_0)}(\lambda)>0,
\end{align*}
which is a contradiction. This proves~\ref{concl:a}.

Statement~\ref{concl:b} follows immediately from~\ref{concl:a}
since by \eqref{baru}, if $(x,t)\in P$ and $I(x,t)$ is a
single point,
$$
l\left(\overline{A}(x,t)\right)=L\left(\overline{A}(x,t)\right)=
\int_{\mathbb{R}} \lambda \,d\nu_{(x,t)}(\lambda)= u(x,t).
$$
{}From~\ref{concl:b} and \eqref{barA} (with $\Psi(\xi)=\xi$), we know
already that~\ref{concl:c} holds for all $(x,t)\in P$.  Let $(x,t)\in H$
and keep in mind that $I(x,t)$ is now an interval on which $A(\cdot)$
is constant.  Hence, from \eqref{barA} and \eqref{baru} we get
$$
\overline{A}(x,t)=\int_{I(x,t)} A(\lambda) \,d\nu_{(x,t)}(\lambda)=
A\Big(\int_{I(x,t)} \lambda \,d\nu_{(x,t)}(\lambda)\Big)
=A(u(x,t)).
$$
Thus, we have shown that~\ref{concl:c} holds for all $(x,t)\in
\left(H\bigcup P\right)=\Pi_T\setminus N$.
\end{proof}

\begin{remark}\normalfont
   Note statement~\ref{concl:b} of  Lemma~\ref{lem:Alimit_ident} implies that
   $\{u_{\varepsilon}\}_{\varepsilon>0}$ converges to $u$ a.e.~on $P$.  The proof of
   this claim is classical.  Let $K:=P\bigcap [a,b]$ for any
   $a,b\in\mathbb{R}$ (this is a measurable set), and note that
   $u_{\varepsilon}^2\overset{\star}\rightharpoonup
   u^2$ in $L^{\infty}(K)$.  Then we have
   \begin{align*}
      \iint_{K}\bigl(u_{\varepsilon}-u\bigr)^2\, dt\, dx
      =\iint_{K}
      \bigl(u_{\varepsilon}^2  - 2 u_{\varepsilon} u+u^2\Bigr)\, dt\, dx
      \to 0\,\, \text{as $\varepsilon\downarrow 0$},
   \end{align*}
   from which the claim follows.
\end{remark}

In the next lemma we sum up the compactness properties of the
``diffusion part'' of \eqref{approx_problem}.

\begin{lemma}
   \label{lem:A_conv}
   A subsequence of $\left\{A(u_{\varepsilon})\right\}_{\varepsilon>0}$
   converges strongly to $A(u)$ in $L^2_{\mathrm{loc}}(\Pi_T)$, where $u$
   is the $L^{\infty}(\Pi_T)$ weak-$\star$ limit
   of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$. Furthermore,
   $$
   A(u)\in L^{\infty}(\Pi_T)\cap L^2(0,T;H^1(\mathbb{R})).
   $$
\end{lemma}

\begin{proof}
   The proof is an immediate consequence of
   Lemmas \ref{lem:L2_comp_A} and
   \ref{lem:Alimit_ident}.
\end{proof}
Before we continue, we shall need the following interpolation lemma
due to Kru\v{z}kov \cite{KruzkovII}:

\begin{lemma}[Kru\v{z}kov \cite{KruzkovII}]
   \label{lem:Kruzkov}
   Let $u(x,t)$ be a bounded measurable function defined on
   $\Pi_T$. Assume that there exists a nondecreasing continuous
   function (where we indicate the dependence on $u$ by
   writing~``$\,;u\,$'')
   $\nu(\cdot;u):[0,\infty)\to [0,\infty)$ such that $\nu(0;u)=0$ and
    \begin{equation}
         \int_{\mathbb{R}} \abs{u\left(x+y,t\right)-u(x,t)}\, dx \le
       \nu(\abs{y};u), \quad \forall y\in\mathbb{R}, \forall t\in(0,T).
        \label{eq:Kruzassume1}
    \end{equation}
    Suppose that for any
    $\phi\in C^{\infty}_0(\mathbb{R})$ and any $t_1$,$t_2$ $\in (0,T)$,
    \begin{equation}
      \label{eq:Kruzassume2}
      \Big|\int_{\mathbb{R}} \bigl(u\left(x,t_2\right)
          -u\left(x,t_1\right)\bigr)\phi(x)\, dx\Big| \le C
      \Bigl(\norm{\phi}{L^{\infty}(R)}
      + \norm{\partial_x\phi}{L^{\infty}(R)}\Bigr)\abs{t_2 -t_1},
    \end{equation}
    where the constant does not depend on $\phi$ or $t$.
    Then for any $t_1,t_2\in (0,T)$ and all $\varepsilon>0$
    \begin{equation}
       \label{eq:time-estimate}
       \int_{\mathbb{R}} \abs{u(x,t_2)-u(x,t_1)}\, dx \le
       C\Big(\frac{\abs{t_2-t_1}}{\varepsilon}
       +\nu(\varepsilon;u)\Big).
     \end{equation}
\end{lemma}

Our next lemma provides us with
a series of priori estimates that imply
strong compactness of the ``total flux'' sequence
$\left\{\gamma_{\varepsilon}(x)f(u_{\varepsilon}) -
\partial_x A_{\varepsilon}(u_{\varepsilon})\right\}_{\varepsilon>0}$.
However, these a priori estimates only hold if
the initial function $u_0$ satisfies, in
addition to \eqref{unull_ass}, the stronger regularity condition
\begin{equation}
   \label{smooth_data}
   \left|\gamma(x)f(u_0) - \partial_x A(u_0)\right|_{BV(\mathbb{R})}<\infty.
\end{equation}
In the proof of the next lemma, we shall
need the approximate sign function
\begin{align}
   \label{sgnappr}
   \mathrm{sign}_{\eta}(\xi) :=
   \begin{cases}
      \mathop{\rm sign}(\xi)  & \text{if $|\xi|>\eta$}, \\
      \xi/\eta & \text{if $|\xi|\leq \eta$},
   \end{cases}
   \quad \eta>0.
\end{align}
\begin{lemma}
   \label{flux_estimates}
   Suppose that \eqref{smooth_data} holds and introduce
   the function
   $$
   v_{\varepsilon}(x,t) = \gamma_{\varepsilon}(x)f(u_{\varepsilon}) -
   \partial_x A_{\varepsilon}(u_{\varepsilon}).
   $$
   There exists a constant $C>0$, independent of $\varepsilon$, such that
   for all $t\in (0,T)$
   \begin{itemize}
       \item[({\bf i})] \label{concl:tfea} $\norm{v_{\varepsilon}
       (\cdot,t)}{L^{\infty}(\mathbb{R})}\le C$,

       \item[({\bf ii})] \label{concl:tfeb} $\left|v_{\varepsilon}(\cdot,t)
       \right|_{BV(\mathbb{R})}\le C$,

       \item[({\bf iii})] \label{concl:tfec} $\norm{v_{\varepsilon}(\cdot,t+\tau)
       -v_{\varepsilon}(\cdot,t)}{L^1(\mathbb{R})}\le C\sqrt{\tau}, \,\,\forall \tau\ge 0$.
   \end{itemize}
   In particular, we have that $\left\{v_{\varepsilon}\right\}_{\varepsilon>0}$
   is strongly compact in $L^1_{\mathrm{loc}}(\Pi_T)$.
\end{lemma}

\begin{proof}
We rewrite $v_{\varepsilon}$ as
$$
v_{\varepsilon}(x,t) = \int^x \partial_t u_{\varepsilon} (\xi,t)\,d\xi,
$$
and observe that $v_{\varepsilon}$ satisfies the linear uniformly parabolic
equation
\begin{equation}
   \label{v_eqn}
   \partial_t v_{\varepsilon} + \gamma_{\varepsilon}(x) f'(u_{\varepsilon})
   \partial_x v_{\varepsilon}
   = \partial_x \bigl(A_{\varepsilon}'(u_{\varepsilon})\partial_x v_{\varepsilon}\bigr).
\end{equation}
Then the maximum principle for \eqref{v_eqn} gives
$$
\norm{v_{\varepsilon}(\cdot,t)}{L^{\infty}(\mathbb{R})}\le
\norm{v_{\varepsilon}(\cdot,0)}{L^{\infty}(\mathbb{R})}.
$$
We shall derive a $BV$ estimate for $v_{\varepsilon}$.  Differentiate
\eqref{v_eqn} with respect to $x$, set $w_{\varepsilon}=\partial_x
v_{\varepsilon}$, multiply with
$\mathrm{sign}_{\eta}(w_{\varepsilon})$, and  integrate over $(x,s)\in
\Pi_t:=\mathbb{R}\times[0,t]$.  The final result reads
\begin{multline*}
\iint_{\Pi_t} \Bigl(\partial_t w_{\varepsilon}
\mathrm{sign}_{\eta}(w_{\varepsilon})
+ \partial_x \bigl(\gamma_{\varepsilon}(x) f'(u_{\varepsilon}) w_{\varepsilon}\bigr)
\mathrm{sign}_{\eta}(w_{\varepsilon}) \\
- \partial_x^2 \bigl(A_{\varepsilon}'(u_{\varepsilon})
w_{\varepsilon}\bigr)\mathrm{sign}_{\eta}(w_{\varepsilon}) \Bigr)\, ds\, dx=0.
\end{multline*}
Since for each fixed $\varepsilon>0$, $\partial_x w_{\varepsilon}$ is summable,
\begin{multline*}
   \iint_{\Pi_t}
   \partial_x \bigl(\gamma_{\varepsilon}(x) f'(u_{\varepsilon}) w_{\varepsilon}\bigr)
   \mathrm{sign}_{\eta}(w_{\varepsilon})\, ds\, dx\\
   = - \iint_{\Pi_t} \gamma_{\varepsilon}(x) f'(u_{\varepsilon}) w_{\varepsilon}\,
   \mathrm{sign}_{\eta}'(w_{\varepsilon})\partial_x w_{\varepsilon}\, ds\, dx
   \to 0 \,\, \text{as $\eta\downarrow 0$}.
\end{multline*}
Similarly, for each fixed $\varepsilon>0$ we have
\begin{align*}
&\iint_{\Pi_t} \partial_x^2 \bigl(A_{\varepsilon}'(u_{\varepsilon})
   w_{\varepsilon}\bigr)\mathrm{sign}_{\eta}(w_{\varepsilon})\, ds\, dx\\
   &
   = - \iint_{\Pi_t}\partial_x \bigl( A_{\varepsilon}'(u_{\varepsilon})
   w_{\varepsilon}\bigr)
   \, \mathrm{sign}_{\eta}'(w_{\varepsilon})\partial_x w_{\varepsilon}\, ds\, dx
\\ &
   = - \iint_{\Pi_t}\partial_x A_{\varepsilon}'(u_{\varepsilon}) w_{\varepsilon}
   \, \mathrm{sign}_{\eta}'(w_{\varepsilon})\partial_x w_{\varepsilon}\, ds\, dx
   - \iint_{\Pi_t} A_{\varepsilon}'(u_{\varepsilon})
   \, \mathrm{sign}_{\eta}'(w_{\varepsilon})
   (\partial_x w_{\varepsilon})^2\, ds\, dx
   \\
   &\le - \iint_{\Pi_t}\partial_x A_{\varepsilon}'(u_{\varepsilon}) w_{\varepsilon}
   \, \mathrm{sign}_{\eta}'(w_{\varepsilon})\partial_x w_{\varepsilon}\, ds\, dx
   \to 0 \,\, \text{as $\eta\downarrow 0$},
\end{align*}
since $\partial_x A'(u_{\varepsilon})$ is bounded.  Finally,
\begin{align*}
   &\iint_{\Pi_t} \partial_t w_{\varepsilon}
   \mathrm{sign}_{\eta}(w_{\varepsilon})\, ds\, dx\\
   &=\iint_{\Pi_t} \partial_t
   \Big(\int_0^{w_{\varepsilon}(x,t)}\mathrm{sign}_{\eta}(\xi)\, d\xi\Big)\, ds\, dx
   \\ & = \int_{\mathbb{R}} \Big(\int_0^{w_{\varepsilon}(x,T)}\mathrm{sign}_{\eta}(\xi)
   \, d\xi\Big)\, dx
   - \int_{\mathbb{R}} \Big(\int_0^{w_{\varepsilon}(x,0)}\mathrm{sign}_{\eta}(\xi)
    \, d\xi\Big)\, dx.
   \\ &  \to  \int_{\mathbb{R}} \abs{w_{\varepsilon}(x,T)}\, dx
   - \int_{\mathbb{R}} \abs{w_{\varepsilon}(x,0)}\, dx\quad \text{as $\eta\downarrow 0$.}
\end{align*}
Summing up,
$\int_{\mathbb{R}} \abs{w_{\varepsilon}(x,t)}\, dx
\le \int_{\mathbb{R}} \abs{w_{\varepsilon}(x,0)}\, dx$.
{}From this we conclude that
$$
\left|v_{\varepsilon}(\cdot,t)\right|_{BV(\mathbb{R})}\le
\left|v_{\varepsilon}(\cdot,0)\right|_{BV(\mathbb{R})}.
$$
We next prove that $v_{\varepsilon}$ is $L^1$ H\"older continuous in time with
exponent $1/2$.  Multiplying \eqref{v_eqn} by a test function
$\varphi\in C^{\infty}_0$ and then do integration by parts, we get
\begin{align*}
   \int_{\mathbb{R}} \partial_t v_{\varepsilon} \varphi(x) &=
   -\int_{\mathbb{R}}\gamma_{\varepsilon}(x) f'(u_{\varepsilon})
   \partial_x v_{\varepsilon} \varphi(x)\, dx
   +\int_{\mathbb{R}} A_{\varepsilon}'(u_{\varepsilon})\partial_x v_{\varepsilon}
   \partial_x \varphi(x)\, dx
   \\ &
   \le C\Bigl(\norm{\varphi}{L^{\infty}(\mathbb{R})}
   + \norm{\partial_x \varphi}{L^{\infty}(\mathbb{R})} \Bigr),
\end{align*}
since $v_{\varepsilon}$ is of bounded variation.  Consequently,
$$
\int_{\mathbb{R}} \Bigl(v_{\varepsilon}(x,t+\tau)-v_{\varepsilon}(x,t)\Bigr)\varphi(x)\, dx
\le C\Bigl(\norm{\varphi}{L^{\infty}(\mathbb{R})} + \norm{\partial_x \varphi}{L^{\infty}(\mathbb{R})}
\Bigr)\tau.
$$
Using Kru\v{z}kov's interpolation lemma (Lemma \ref{lem:Kruzkov}), we
can conclude that
$$
\int_{\mathbb{R}} \bigl|v_{\varepsilon}(x,t+\tau)-v_{\varepsilon}(x,t)\bigr|\, dx\le C\sqrt{\tau}.
$$

The estimates~\ref{concl:tfea} --~\ref{concl:tfec} and an
application of Kolmogorov's compactness criterion concludes
the proof of the lemma.
\end{proof}

To be able to use the compensated compactness method to treat the
``nonlinear transport part'' of \eqref{approx_problem}, we need the
next lemma.
\begin{lemma}\label{Hneg_comp}
   Suppose that \eqref{smooth_data} holds. Then for any $C^2$ function
   $\eta:\mathbb{R}\to\mathbb{R}$, the sequence of distributions
   $$
   \left\{\partial_t \eta(u_{\varepsilon}) + \partial_x \bigl(\gamma(x)q(u_{\varepsilon})
   \bigr)\right\}_{\varepsilon>0} \,\,
   \text{lies in a compact subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$},
   $$
   where $q:\mathbb{R}\to \mathbb{R}$ is defined by $q'(u)=\eta'(u)f'(u)$.
\end{lemma}
\begin{proof}
Let us define the distribution $\mathcal{L}_{\varepsilon}$ by
$$
\left\langle \mathcal{L}_{\varepsilon}, \varphi \right\rangle
=\iint_{\Pi_T} \Bigl(\eta(u_{\varepsilon})\partial_t \varphi
+ \gamma(x) q(u_{\varepsilon}) \partial_x \varphi\Bigr)\, dt\, dx, \quad
\varphi\in \mathcal{D}(\Pi_T).
$$
Using the equation for $u_{\varepsilon}$
and the definition of $q$, in the sense of distributions we have
\begin{equation}
   \label{formal}
   \begin{split}
      &\partial_t \eta(u_{\varepsilon}) + \partial_x \bigl(\gamma(x)q(u_{\varepsilon})\bigr)
      \\ & \quad
      = \eta'(u_{\varepsilon})\partial_x^2 A_{\varepsilon}(u_{\varepsilon})+
      \partial_x \Bigl(\left[\gamma(x)-\gamma_{\varepsilon}(x)\right]q(u_{\varepsilon})\Bigr)
      + \gamma_{\varepsilon}'(x)\Bigl(q(u_{\varepsilon})-\eta'(u_{\varepsilon})
      f(u_{\varepsilon})\Bigr)
      \\ & \quad
      = \partial_x \Bigl(\eta'(u_{\varepsilon})\partial_x
      A_{\varepsilon}(u_{\varepsilon})\Bigr)
      - \eta''(u_{\varepsilon})A_{\varepsilon}'(u_{\varepsilon})
      \bigl(\partial_x u_{\varepsilon}\bigr)^2
      \\ & \quad \quad +\partial_x \Bigl([\gamma(x)-\gamma_{\varepsilon}(x)]
      q(u_{\varepsilon})\Bigr)
      + \gamma_{\varepsilon}'(x)\Bigl(q(u_{\varepsilon})
      -\eta'(u_{\varepsilon})f(u_{\varepsilon})\Bigr).
   \end{split}
\end{equation}
In view of \eqref{formal}, we therefore have
$$
\left\langle \mathcal{L}_{\varepsilon}, \varphi \right\rangle =
\left\langle \mathcal{L}_{\varepsilon}^1, \varphi \right\rangle
+\left\langle \mathcal{L}_{\varepsilon}^2, \varphi \right\rangle
+\left\langle \mathcal{L}_{\varepsilon}^3, \varphi \right\rangle
+\left\langle \mathcal{L}_{\varepsilon}^4, \varphi \right\rangle,
$$
where
\begin{alignat*}{2}
   &\left\langle \mathcal{L}_{\varepsilon}^1, \varphi \right\rangle
   =\iint_{\Pi_T}
   \eta'(u_{\varepsilon})\partial_x A_{\varepsilon}(u_{\varepsilon})
   \partial_x\varphi\, dt\, dx,
   \\ &
   \left\langle \mathcal{L}_{\varepsilon}^2, \varphi \right\rangle
    =\iint_{\Pi_T}
   \eta''(u_{\varepsilon})A_{\varepsilon}'(u_{\varepsilon})
   \bigl(\partial_x u_{\varepsilon}\bigr)^2 \varphi\, dt\, dx,
   \\&\left\langle \mathcal{L}_{\varepsilon}^3, \varphi \right\rangle
   =\iint_{\Pi_T}
   \left[\gamma(x)-\gamma_{\varepsilon}(x)\right]q(u_{\varepsilon})
   \partial_x \varphi\, dt\, dx,
   \\ &
   \left\langle \mathcal{L}_{\varepsilon}^4, \varphi \right\rangle
   =-\iint_{\Pi_T}
   \gamma_{\varepsilon}'(x)\Bigl(q(u_{\varepsilon})
   -\eta'(u_{\varepsilon})f(u_{\varepsilon})\Bigr)\varphi\, dt\, dx.
\end{alignat*}
Using Lemma \ref{lem:max} and \eqref{eq:NR}, we get
$$
\Big|\iint_{\Pi_T}
   \eta''(u_{\varepsilon})A_{\varepsilon}'(u_{\varepsilon})
   \bigl(\partial_x u_{\varepsilon}\bigr)^2 \, dt\, dx\Big|\le C,
$$
and hence $\left|\left\langle \mathcal{L}_{\varepsilon}^2, \varphi \right\rangle\right|
\le C \norm{\varphi}{L^{\infty}(\Pi_T)}$.
Again thanks to to Lemma \ref{lem:max} and the fact
that $\left|\gamma_{\varepsilon}\right|_{BV(\mathbb{R})}$ is bounded uniformly
with respect to $\varepsilon$, we also have
$$
\left|\left\langle \mathcal{L}_{\varepsilon}^4, \varphi \right\rangle\right|
\le C \norm{\varphi}{L^{\infty}(\Pi_T)}.
$$
Therefore $\norm{\mathcal{L}_{\varepsilon}^2
+ \mathcal{L}_{\varepsilon}^4}{\mathcal{M}(\Pi_T)} \le C$, i.e.,
$\left\{\mathcal{L}_{\varepsilon}^2
+ \mathcal{L}_{\varepsilon}^4 \right\}_{\varepsilon>0}$
is bounded in $\mathcal{M}(\Pi_T)$

Next, we have
$$
\left|\left\langle \mathcal{L}_{\varepsilon}^3, \varphi \right\rangle\right|
\le \norm{\gamma - \gamma_{\varepsilon} }{L^2(\Pi_T)}\norm{\partial_x\varphi}{L^2(\Pi_T)}
\to 0\,\, \text{as $\varepsilon\downarrow 0$},
$$
so that $\left\{\mathcal{L}_{\varepsilon}^3\right\}_{\varepsilon>0}$ is compact
in $H_{\mathrm{loc}}^{-1}(\Pi_T)$.
Finally, let us consider $\mathcal{L}_{\varepsilon}^1$.  We write
$$
\left\langle \mathcal{L}_{\varepsilon}^1, \varphi \right\rangle =
\left\langle \mathcal{L}_{\varepsilon}^{1,1}, \varphi \right\rangle
+\left\langle \mathcal{L}_{\varepsilon}^{1,2}, \varphi \right\rangle,
$$
where
\begin{align*}
   \left\langle \mathcal{L}_{\varepsilon}^{1,1}, \varphi \right\rangle
   =\iint_{\Pi_T}
   \eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon}) \partial_x \varphi\, dt\, dx, \quad
   \left\langle \mathcal{L}_{\varepsilon}^{1,2}, \varphi \right\rangle
   =\iint_{\Pi_T}
   \eta'(u_{\varepsilon})\varepsilon \partial_x u_{\varepsilon} 
   \partial_x \varphi\, dt\, dx.
\end{align*}
Using \eqref{eq:NR} once more, we get
$$
   \left|\left\langle \mathcal{L}_{\varepsilon}^{1,2}, \varphi \right\rangle\right|
   \le C\sqrt{\varepsilon}\norm{\partial_x\varphi}{L^2(\Pi_T)}
   \to 0\,\, \text{as $\varepsilon\downarrow 0$},
$$
so that also
$\left\{\mathcal{L}_{\varepsilon}^{1,2}\right\}_{\varepsilon>0}$
is compact in $H_{\mathrm{loc}}^{-1}(\Pi_T)$.

In what follows, we use the term ``converges'' as shorthand for
``converges along a subsequence''.  The semicontinuity of $l(\cdot)$
and $L(\cdot)$ implies that
$$
l(\xi) \le \liminf_{\eta\to \xi} l(\eta), \quad
L(\xi) \ge \limsup_{\eta\to \xi} L(\eta).
$$
In addition, we have
$$
l\left(A(u_{\varepsilon}(x,t))\right)\le u_{\varepsilon}(x,t)\le
L\left(A(u_{\varepsilon}(x,t))\right)\,\,
\text{for all $(x,t)\in \Pi_T$ and $\varepsilon>0$}.
$$
Consequently,
\begin{equation}
   \label{liminfsup}
   \begin{split}
      & \liminf_{\varepsilon\downarrow 0} u_{\varepsilon}(x,t) 
      \ge l\left(A(u(x,t))\right)
      \,\,\text{for a.e.~$(x,t)\in \Pi_T$}, \\
      & \limsup_{\varepsilon\downarrow 0} u_{\varepsilon}(x,t) \le
      L\left(A(u(x,t))\right)\,\,\text{for a.e.~$(x,t)\in \Pi_T$}.
   \end{split}
\end{equation}
By \eqref{liminfsup}, and since
$$
\text{$A'(\lambda)=0$ for all $\lambda\in [0,1]$ such
that $l(A(\lambda))<L(A(\lambda))$},
$$
it follows that
$$
A'(u_{\varepsilon})\to 0\,\, \text{a.e.~on $H$ as $\varepsilon\downarrow 0$}.
$$
Therefore, in view of Lemma \ref{lem:max} and \eqref{eq:NR}, 
as $\varepsilon\downarrow 0$,
\begin{align*}
   &\iint_{H\cap [a,b]}
   \left|\eta'(u_{\varepsilon})A'(u_{\varepsilon})
   \partial_x u_{\varepsilon} \right|\, dt\, dx
   \\ &
   \le C\, \Big(\iint_{H\bigcap [a,b]}
   A'(u_{\varepsilon})\, dt\, dx\Big)^{1/2}
   \Big(\iint_{H\bigcap [a,b]} A'(u_{\varepsilon})
   \bigl(\partial_x u_{\varepsilon}\bigr)^2
   \, dt\, dx\Big)^{1/2}\to 0,
\end{align*}
for any interval
$[a,b]\subset \mathbb{R}$. Hence
$$
\eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon}) \to 0\,\,\text{a.e.~on $H$
as $\varepsilon\downarrow 0$}.
$$

On the other hand, Lemma \ref{lem:Alimit_ident} shows that
$\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ converges
a.e.~on $P$. From Lemma~\ref{flux_estimates}, we have that
$$
\left\{\gamma_{\varepsilon}(x)f(u_{\varepsilon})
- \partial_x A_{\varepsilon}(u_{\varepsilon})\right\}_{\varepsilon>0}\,\,
\text{converges a.e.~on $\Pi_T$}.
$$
Since $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$
converges a.e.~on $P$, we conclude that
$$
\left\{\eta'(u_{\varepsilon})\partial_x A_{\varepsilon}(u_{\varepsilon})
\right\}_{\varepsilon>0}\,\,
\text{converges a.e.~on $P$}.
$$
Since $\partial_x A_{\varepsilon}(u_{\varepsilon})= \partial_x A(u_{\varepsilon})
+ \varepsilon \partial_x u_{\varepsilon}$ and $\eta'(u_{\varepsilon})\varepsilon
\partial_x u_{\varepsilon} \to 0$ a.e.~on $\Pi_T$, we conclude that also
$$
\left\{\eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon})\right\}_{\varepsilon>0}\,\,
\text{converges a.e.~on $P$}.
$$
Hence we have shown that
$\{\eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon})\}_{\varepsilon>0}$
converges a.e.~on $H\cup P=\Pi_T\setminus N$
(and hence a.e.~on $\Pi_T$).
Moreover, from Lemma \ref{lem:max} and \eqref{eq:NR},
$\eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon})\in L^2(\Pi_T)$.
Consequently,
$$
\left\{\eta'(u_{\varepsilon})\partial_x A(u_{\varepsilon})\right\}_{\varepsilon>0}\,\,
\text{converges strongly in $L^2(\Pi_T)$},
$$
and $\left\{\mathcal{L}_{\varepsilon}^{1,1}\right\}_{\varepsilon>0}$
belongs to a compact subset of $H_{\mathrm{loc}}^{-1}(\Pi_T)$.

Summing up, we have proved that the sequence of distributions
$\left\{\mathcal{L}_{\varepsilon}\right\}_{\varepsilon>0}$ is
the sum of two terms, one which is
compact in $H_{\mathrm{loc}}^{-1}(\Pi_T)$ and one
which is bounded in $\mathcal{M}(\Pi_T)$.
In addition, Lemma \ref{lem:max} implies that
$\left\{\mathcal{L}_{\varepsilon}\right\}_{\varepsilon>0}$
belongs to a bounded subset of $W^{-1,\infty}(\Pi_T)$.
Hence, the proof of the lemma is now finished by appealing to
Lemma \ref{Murat}.
\end{proof}

Our main result is the following theorem:

\begin{theorem}\label{main_thm}
   Suppose that conditions \eqref{gamma_ass}--\eqref{unull_ass}
   hold. Then there exists a weak solution (in the sense of
   Definition \ref{weak_def}) of the
   Cauchy problem \eqref{eq:prob1}.
   Furthermore, $u$ can be constructed as
   the strong limit of the sequence $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$,
   where $u_{\varepsilon}$ solves the regularized problem \eqref{approx_problem}.

   Let $v$ be another weak solution constructed as the strong limit of
   the sequence $\{v_{\varepsilon}\}_{\varepsilon>0}$, where $v_{\varepsilon}$  solves
   the regularized problem \eqref{approx_problem}
   corresponding to initial data $v_0$. Then
   \begin{equation}
      \label{stab}
      \int_{\mathbb{R}} \abs{u(x,t)-v(x,t)}\, dx \le
      \int_{\mathbb{R}} \abs{u_0(x)-v_0(x)}\, dx.
   \end{equation}
   Consequently, the constructed weak
   solution $u$ of \eqref{eq:prob1} is unique.

   Suppose that the initial function $u_0$ satisfies the
   additional regularity condition stated in
   \eqref{smooth_data}. Then the constructed weak solution $u$
   has the following regularity properties:
   \begin{itemize}
       \item[({\bf i})] \label{concl:flux_BV}
         $\left|\bigl(\gamma(x) f(u) - \partial_x A(u)\bigr)(\cdot,t)
         \right|_{BV(\mathbb{R})}\le C$,
         \,\,$\forall t\in (0,T)$.

       \item[({\bf ii})] \label{concl:L1_Lip}
         $\norm{u(\cdot,t+\tau)-u(\cdot,t)}
       {L^1(\mathbb{R})}\le C\tau, \,\,\forall \tau\ge 0$.
   \end{itemize}
\end{theorem}

\begin{proof}
First, let us assume that the additional regularity condition in
\eqref{smooth_data} holds.  By Lemma~\ref{Hneg_comp} and
Theorem~\ref{Tartar}, we have that
$$
u_{\varepsilon} \to u \,\, \text{along a
subsequence a.e.~in $\Pi_T$ as $\varepsilon\downarrow 0$}.
$$
Lemma \ref{lem:max} states that the limit $u$ belongs to
$L^1(\Pi_T)\bigcap L^{\infty}(\Pi_T)$, so that the convergence holds true
in $L^p(\Pi_T)$ for any $p\in [1,\infty)$.  From Lemma \ref{lem:A_conv},
it follows that $A(u)\in L^2(0,T;H^1(\mathbb{R}))$.  Hence, the limit $u$
satisfies \ref{def:weak1}.  Multiplying the equation for $u_{\varepsilon}$ by a
test function $\varphi\in \mathcal{D}(\mathbb{R}\times [0,T))$ and then
do integration by parts in $x$ and $t$, we get
\begin{align*}
   &\iint_{\Pi_T}\Bigl(u\partial_t \varphi
   + \gamma_{\varepsilon}(x)f(u_{\varepsilon})\partial_x \varphi
   + \left(A(u_{\varepsilon}) + \varepsilon u_{\varepsilon}\right)
   \partial_x^2\varphi\Bigr)\, dt\, dx
   \\ & \qquad 
   + \int_{\mathbb{R}} {u_0}_\varepsilon(x)\,\phi(x,0)\,dx= 0.
\end{align*}
Sending $\varepsilon\downarrow 0$, it follows (after an integration by parts) that
the limit $u$ satisfies \ref{def:weak2}. In addition,
({\bf i}) and ({\bf ii}) are direct
consequences of Lemma \ref{flux_estimates}.
This concludes the proof when \eqref{smooth_data} holds.

We will now remove the extra assumption \eqref{smooth_data} by using a
stability result for ``smooth'' $\gamma(\cdot)$ found in
\cite{KR:Rough_Unique}, which tells us that
$\int_{\mathbb{R}} \abs{u_{\varepsilon}(x,t)-v_{\varepsilon}(x,t)}
\, dx \le \int_{\mathbb{R}}
\abs{u_{\varepsilon}(x,0)-v_{\varepsilon}(x,0)}\, dx$, where $v_{\varepsilon}$
solves \eqref{approx_problem} corresponding
to initial data $v_0$ satisfying \eqref{smooth_data}.
Sending $\varepsilon\downarrow 0$ yields \eqref{stab}
whenever $u_0,v_0$ satisfy \eqref{smooth_data}.  If $u_0$ satisfies
\eqref{unull_ass}, we can certainly find a sequence
$\left\{u_0^m\right\}_{m=1}^{\infty}$ such that each $u_0^m$ satisfy
\eqref{smooth_data} and $u_0^m\to u_0$ in $L^1(\mathbb{R})$ as
$m\uparrow\infty$.  Let $u^{\varepsilon}$ be a weak solution of \eqref{eq:prob1} with
initial data $u_0^m$.  Using \eqref{stab}, we get
$$
\int_{\mathbb{R}} \abs{u^m(x,t)-u^n(x,t)}\, dx \le
\int_{\mathbb{R}} \abs{u_0^m(x)-u_0^n(x)}\, dx \to 0 \,\,
\text{as $m,n\uparrow \infty$}.
$$
Hence $\left\{u^m\right\}_{m=1}^{\infty}$ is a Cauchy sequence in
$L^1(\Pi_T)$.  It is not difficult to check that the limit $u$ of this
sequence satisfies \ref{def:weak1} and \ref{def:weak2}.  This
concludes the proof of the theorem.
\end{proof}

\begin{remark}\normalfont
   In the pure hyperbolic case, Theorem \ref{main_thm} ({\bf i})
   implies that the total variation of $f(u)$
   is finite if $u_0\in BV(\mathbb{R})$ (recall
   that $\gamma \not=0$ a.e.), although the total variation
   of $u$ need not be finite. This fact has already been established
   by Klausen and Risebro \cite{KlausenRisebro}.
   However, their proof is much more complicated than the
   elementary proof given here (see the proof
   of Lemma \ref{flux_estimates}).
\end{remark}

\begin{remark}\normalfont
  It is worthwhile mentioning that if $A(\cdot)$ is strictly increasing we do
  not need the compensated compactness method to get strong convergence
  of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$.  This is the typical situation that
  one has to deal with in models for two-phase flow in porous media
  (see, e.g., \cite{EspKar}).  In this case, we have strong $L^2_{\mathrm{loc}}$
  convergence of $\left\{u_{\varepsilon}\right\}_{\varepsilon>0}$ directly from Lemma
  \ref{lem:Alimit_ident}.
\end{remark}
Provided the initial function $u_0$ is sufficiently smooth, it is
possible to upgrade the strong $L^2$ compactness of
$\left\{A(u_{\varepsilon})\right\}_{\varepsilon>0}$ to strong compactness in the H\"older
space $C^{1,\frac12}$.  This is the content of the following
proposition, which also shows that $A(u)$ is H\"older continuous,
i.e., significantly more regular than anticipated by Definition
\ref{weak_def}.
\begin{prop}
   \label{prop:A_Holder}
   Suppose that conditions \eqref{gamma_ass}-\eqref{unull_ass}
   hold. In addition, suppose that \eqref{smooth_data} holds.
   Then there exists a constant $C$, independent of
   $\varepsilon$, such that
   $$
   \Bigl|A_\varepsilon(u_{\varepsilon}(x+y,t+\tau))
   -A_\varepsilon(u_{\varepsilon}(x,t))\Bigr|
   \le C\Bigl(\abs{y}+ \sqrt{\tau}\Bigr),
   $$
   for all $y\in \mathbb{R}$ and $\tau\ge 0$ with $t+\tau<T$.
   In particular, $\left\{A_\varepsilon(u_{\varepsilon})\right\}_{\varepsilon>0}$
   converges along a subsequence to some function $\overline{A}$
   uniformly on compact subsets of $\Pi_T$ as $\varepsilon\downarrow 0$ and
   $$
   \overline{A}\in C^{1,\frac12}(\Pi_T).
   $$
   If $u$ denotes the weak solution in Theorem \ref{main_thm}, then
   $\overline{A}=A(u)$ a.e.~on $\Pi_T$.
\end{prop}
\begin{proof}
Since $u_{\varepsilon},\gamma_{\varepsilon}(x)f(u_{\varepsilon})$ are
uniformly bounded, we get
from Lemma \ref{concl:tfea} ({\bf i})
$$
\norm{\partial_x A_{\varepsilon}(u_{\varepsilon}(\cdot,t))}{L^{\infty}(\mathbb{R})}\le C, \quad
\forall t\in (0,T).
$$
{}From this estimate and the $L^{\infty}$ bound on $u_{\varepsilon}$, we get
\begin{equation}
   \label{Holder_space}
   A_{\varepsilon}(u_{\varepsilon}(x+y,t))
   -A_{\varepsilon}(u_{\varepsilon}(x,t))\le C \abs{y}.
\end{equation}
Following Zhao \cite{Zhao:CC}, we show next that
$A_{\varepsilon}(u_{\varepsilon})$ is H\"older continuous in time.
To this end, let $\tau>0$ and note that
\begin{align*}
   &\int_x^{x+\sqrt{\tau}}
   \Bigl(u_{\varepsilon}(x,t+\tau) - u_{\varepsilon}(x,t)\Bigr)\, dx
    = \int_x^{x+\sqrt{\tau}} \int_{t}^{t+\tau}
   \partial_t u_{\varepsilon} (x,\xi)\, d\xi\, dx
   \\
   &\quad = \int_x^{x+\sqrt{\tau}} \int_{t}^{t+\tau}
   \Bigl(- \partial_x \bigl(\gamma_{\varepsilon}(x)f(u_{\varepsilon}(x,\xi))
   + \partial_x^2 A_{\varepsilon}(u_{\varepsilon}(x,\xi))\bigr)\Bigr)\, d\xi \, dx
   \\ &\quad =
   \int_{t}^{t+\tau}\biggl(
   \Bigl[- \gamma_{\varepsilon}(x)f(u_{\varepsilon}(x,\xi))\Bigr]_x^{x+\sqrt{\tau}}
   + \Bigl[\partial_x A_{\varepsilon}(u_{\varepsilon}(x,\xi))
    \Bigr]_x^{x+\sqrt{\tau}}\biggr)\, d\xi\, dx
   \\ & \quad \le C \bigl(t+\tau-t\bigr)=C\tau.
\end{align*}
By the mean value theorem there exists an
$x^*$ between $x$ and $x+\sqrt{\tau}$ such that
$$
\Bigl(u_{\varepsilon}(x^*,t+\tau) - u_{\varepsilon}(x^*,t)\Bigr)\sqrt{\tau}\le C\tau
\Longrightarrow \Bigl|u_{\varepsilon}(x^*,t+\tau) - u_{\varepsilon}(x^*,t)\Bigr| \le
C\sqrt{\tau}.
$$
Consequently, we can calculate as follows
\begin{equation}
   \label{Holder_time}
   \begin{split}
      &\Bigl|A_{\varepsilon}(u_{\varepsilon}(x,t+\tau))
      -A_{\varepsilon}(u_{\varepsilon}(x,t))\Bigr|
      \\ & \quad
      \le \Bigl|A_{\varepsilon}(u_{\varepsilon}(x,t+\tau))
      -A_{\varepsilon}(u_{\varepsilon}(x^*,t+\tau))\Bigr|
      +\Bigl|A_{\varepsilon}(u_{\varepsilon}(x^*,t+\tau))
      -A_{\varepsilon}(u_{\varepsilon}(x^*,t))\Bigr|
      \\&\quad\quad\quad
      +\Bigl|A_{\varepsilon}(u_{\varepsilon}(x^*,t))
      -A_{\varepsilon}(u_{\varepsilon}(x,t))\Bigr|
      \\ & \quad \le C\Bigl(|x-x^*| + \tau^{1/2} + |x-x^*|  \Bigr)
      \le C \sqrt{\tau}.
   \end{split}
\end{equation}

In view of \eqref{Holder_space} and \eqref{Holder_time}, an application
of the Ascoli-Arzela compactness criterion
concludes the proof of the proposition.
\end{proof}

\noindent\textbf{Acknowledgment:}
This work has been supported by the
BeMatA program of the Research Council of Norway. This work was
done while K.~H.~Karlsen was visiting the Institute for Pure and
Applied Mathematics (IPAM) at the University of California  Los
Angeles (UCLA). K.~H.~Karlsen is grateful to IPAM for their
hospitality and financial support.


\begin{thebibliography}{10}

\bibitem{Carrillo}
J.~Carrillo.
\newblock Entropy solutions for nonlinear degenerate problems.
\newblock {\em Arch. Rational Mech. Anal.}, 147(4):269--361, 1999.

\bibitem{Chen:LN}
G.-Q. Chen.
\newblock Compactness methods and nonlinear hyperbolic conservation laws.
\newblock In {\em Some current topics on nonlinear conservation laws}, pages
  33--75. Amer. Math. Soc., Providence, RI, 2000.

\bibitem{ChenDiBen}
G.-Q. Chen and E.~DiBenedetto.
\newblock Stability of entropy solutions to the {C}auchy problem for a class of
  hyperbolic-parabolic equations.
\newblock Preprint, 1999.
\newblock To appear in SIAM J. Math. Anal.

\bibitem{Dafermos}
C.~M. Dafermos.
\newblock Polygonal approximation of solutions of the initial value problem for
  a conservation law.
\newblock {\em J. Math. Anal. Appl.}, 38:33--41, 1972.

\bibitem{EspKar}
M.~S. Espedal and K.~H. Karlsen.
\newblock Numerical solution of reservoir flow models based on large time step
  operator splitting algorithms.
\newblock In {\em Filtration in Porous Media and Industrial Applications
  (Cetraro, Italy, 1998)}, volume 1734 of {\em Lecture Notes in Mathematics},
  pages 9--77. Springer, Berlin, 2000.

\bibitem{Gimsebro:Cauchy}
T.~Gimse and N.~H. Risebro.
\newblock Solution of the {C}auchy problem for a conservation law with a
  discontinuous flux function.
\newblock {\em SIAM J. Math. Anal.}, 23(3):635--648, 1992.

\bibitem{HoldenHoegh}
H.~Holden, L.~Holden, and R.~H{\o}egh-Krohn.
\newblock A numerical method for first order nonlinear scalar conservation laws
  in one dimension.
\newblock {\em Comput. Math. Appl.}, 15(6-8):595--602, 1988.

\bibitem{HRT-Max:95}
H.~ Holden, N.~H. Risebro, and A.~Tveito.
\newblock Maximum principles for a class of conservation laws.
\newblock {\em SIAM J. Appl. Math.}, 55(3):651--661, 1995.

\bibitem{JohnHong:2000}
J.~M.-K. Hong.
\newblock {\em Part I: An extension of the {R}iemann problems and {G}limm's
  method to general systems of conservation laws with source terms. Part II: A
  total variation bound on the conserved quantities for a generic resonant
  nonlinear balance laws}.
\newblock PhD thesis, University of California, Davis, 2000.

\bibitem{IsaacsonTemple3}
E.~Isaacson and B.~Temple.
\newblock Convergence of the $2\times 2$ {G}odunov method for a general
  resonant nonlinear balance law.
\newblock {\em SIAM J. Appl. Math.}, 55(3):625--640, 1995.

\bibitem{KR:Rough_Diff}
K.~H. Karlsen and N.~H. Risebro.
\newblock Convergence of finite difference schemes for viscous and inviscid
  conservation laws with rough coefficients.
\newblock {\em M2N Math. Model. Numer. Anal.}, 35(2):239--270, 2001.

\bibitem{KR:Rough_Unique}
K.~H. Karlsen and N.~H. Risebro.
\newblock On the uniqueness and stability of entropy solutions of nonlinear
  degenerate parabolic equations with rough coefficients.
\newblock Preprint, {D}epartment of {M}athematics, {U}niversity of {B}ergen, 2000.

\bibitem{KR:HJsplitt}
K.~H. Karlsen and N.~H. Risebro.
\newblock Unconditionally stable methods for {H}amilton-{J}acobi equations.
\newblock {\em J. Comp. Phys.}, 180(2):710-735, 2002.

\bibitem{KRT:FDM_degen}
K.~H. Karlsen, N.~H. Risebro, and J.~D. Towers.
\newblock Upwind difference approximations for degenerate parabolic
  convection-diffusion equations with a discontinuous coefficient.
\newblock {\em IMA J. Numer. Anal.}, 2002.

\bibitem{KlausenRisebro}
R.~A. Klausen and N.~H. Risebro.
\newblock Stability of conservation laws with discontinuous coefficients.
\newblock {\em J. Differential Equations}, 157(1):41--60, 1999.

\bibitem{KlingbroII}
C.~Klingenberg and N.~H. Risebro.
\newblock Stability of a resonant system of conservation laws modeling polymer
  flow with gravitation.
\newblock {\em J. Differential Equations}, 170(2):344--380, 2001.

\bibitem{KlingbroI}
C.~Klingenberg and N.~H. Risebro.
\newblock Convex conservation laws with discontinuous coefficients.
  {E}xistence, uniqueness and asymptotic behavior.
\newblock {\em Comm. Partial Differential Equations}, 20(11-12):1959--1990, 1995.

\bibitem{KruzkovII}
S.~N. Kru{\v{z}}kov.
\newblock Results on the nature of the continuity of solutions of parabolic
  equations, and certain applications thereof.
\newblock {\em Mat. Zametki}, 6:97--108, 1969.

\bibitem{Kruzkov}
S.~N. Kru{\v{z}}kov.
\newblock First order quasi-linear equations in several independent variables.
\newblock {\em Math. USSR Sbornik}, 10(2):217--243, 1970.

\bibitem{LSU:67}
O.~A. Lady{\v{z}}enskaja, V.~A. Solonnikov, and N.~N. Ural'ceva.
\newblock {\em Linear and quasilinear equations of parabolic type}.
\newblock American Mathematical Society, Providence, R.I., 1967.

\bibitem{LTW:Comparison}
L.~W. Lin, B.~J. Temple, and J.~H. Wang.
\newblock A comparison of convergence rates for {G}odunov's method and
  {G}limm's method in resonant nonlinear systems of conservation laws.
\newblock {\em SIAM J. Numer. Anal.}, 32(3):824--840, 1995.

\bibitem{LTW:Suppression}
L.~W. Lin, B.~J. Temple, and J.~H. Wang.
\newblock Suppression of oscillations in {G}odunov's method for a resonant
  non-strictly hyperbolic system.
\newblock {\em SIAM J. Numer. Anal.}, 32(3):841--864, 1995.

\bibitem{MuratII}
F.~Murat.
\newblock Compacit\'e par compensation.
\newblock {\em Ann. Scuola Norm. Sup. Pisa Cl. Sci. (4)}, 5(3):489--507, 1978.

\bibitem{MuratI}
F.~Murat.
\newblock Compacit\'e par compensation. {I}{I}.
\newblock In {\em Proceedings of the International Meeting on Recent Methods in
  Nonlinear Analysis (Rome, 1978)}, pages 245--256, Bologna, 1979. Pitagora.

\bibitem{Murat:Hneg}
F.~Murat.
\newblock L'injection du c\^one positif de ${H}\sp{-1}$\ dans ${W}\sp{-1,\,q}$\
  est compacte pour tout $q<2$.
\newblock {\em J. Math. Pures Appl. (9)}, 60(3):309--322, 1981.

\bibitem{Oleinik:Discont}
O.~A. Ole{\u\i}nik.
\newblock Discontinuous solutions of non-linear differential equations.
\newblock {\em Amer. Math. Soc Transl. Ser. 2}, 26:95--172, 1963.

\bibitem{Quinn}
B.~K. Quinn.
\newblock Solutions with shocks: An example of an {$L_1$}-contractive
  semigroup.
\newblock {\em Comm. Pure Appl. Math.}, 24:125--132, 1971.

\bibitem{TartarI}
L.~Tartar.
\newblock Compensated compactness and applications to partial differential
  equations.
\newblock In {\em Nonlinear analysis and mechanics: Heriot-Watt Symposium, Vol.
  IV}, pages 136--212. Pitman, Boston, Mass., 1979.

\bibitem{Temple}
B.~Temple.
\newblock Global solution of the {C}auchy problem for a class of $2\times 2$\
  nonstrictly hyperbolic conservation laws.
\newblock {\em Adv. in Appl. Math.}, 3(3):335--375, 1982.

\bibitem{TowersI}
J.~D. Towers.
\newblock Convergence of a difference scheme for conservation laws with a
  discontinuous flux.
\newblock {\em SIAM J. Numer. Anal.}, 38(2):681--698 (electronic), 2000.

\bibitem{TowersII}
J.~D. Towers.
\newblock A difference scheme for conservation laws with a discontinuous flux -
  the nonconvex case.
\newblock {\em SIAM J. Numer. Anal.}, 39(4):1197--1218, 2001.

\bibitem{TveiWi:Hard}
A.~Tveito and R.~Winther.
\newblock The solution of nonstrictly hyperbolic conservation laws may be hard
  to compute.
\newblock {\em SIAM J. Sci. Comput.}, 16(2):320--329, 1995.

\bibitem{Volpert}
A.~I. Vol'pert.
\newblock The spaces {BV} and quasi-linear equations.
\newblock {\em Math. USSR Sbornik}, 2(2):225--267, 1967.

\bibitem{VolHud}
A.~I. Vol'pert and S.~I. Hudjaev.
\newblock Cauchy's problem for degenerate second order quasilinear parabolic
  equations.
\newblock {\em Math. USSR Sbornik}, 7(3):365--387, 1969.

\bibitem{Whitham}
G.~B. Whitham.
\newblock {\em Linear and nonlinear waves}.
\newblock Wiley-Interscience [John Wiley \& Sons], New York, 1974.
\newblock Pure and Applied Mathematics.

\bibitem{Yin:CC}
J.~X. Yin.
\newblock The compensated compactness method applied to quasilinear parabolic
  equations of higher order with doubly strong degeneration.
\newblock {\em Chinese Ann. Math. Ser. B}, 12(4):500--519, 1991.
\newblock A Chinese summary appears in Chinese Ann.\ Math.\ Ser.\ A {\bf 12}
  (1991), no.\ 5, 645.

\bibitem{Zhao:CC}
J.~N. Zhao.
\newblock Applications of the theory of compensated compactness to quasilinear
  degenerate parabolic equations and quasilinear degenerate elliptic equations.
\newblock {\em Northeast. Math. J.}, 2(1):33--48, 1986.

\end{thebibliography}


\end{document}