appendix : adding proof of ident results
This commit is contained in:
parent
a4cc5deec8
commit
6d6652375d
4 changed files with 128 additions and 75 deletions
|
|
@ -1,7 +1,57 @@
|
||||||
\clearpage
|
\clearpage
|
||||||
\pagenumbering{arabic}% resets `page` counter to 1
|
\pagenumbering{arabic}% resets `page` counter to 1
|
||||||
\renewcommand*{\thepage}{A-\arabic{page}}
|
\renewcommand*{\thepage}{S-\arabic{page}}
|
||||||
\appendix
|
\appendix
|
||||||
|
|
||||||
|
\chapter{Supplementary for~\nameref{chap:struct-detection}}
|
||||||
|
\section{Proof of the identifiability result}
|
||||||
|
\label{sec:proof-identifiability}
|
||||||
|
|
||||||
|
We recall the following result.
|
||||||
|
\def\thetheorem{\ref{thm:identifiability-iid}}
|
||||||
|
\begin{theorem}[Identifiability of $iid$-colBiSBM]
|
||||||
|
The parameters $(\bm{\pi}, \bm{\rho}, \bm{\alpha})$ are
|
||||||
|
identifiable up to a label switching of the blocks if those
|
||||||
|
conditions are achieved:
|
||||||
|
\begin{itemize}
|
||||||
|
\item[(1.1)] $\exists m^*\in\{1,\dots,M\} : n^1_{m^*} \geq 2 Q_2 - 1~\text{and}~n^2_{m^*} \geq 2 Q_1 - 1$.
|
||||||
|
\item[(1.2)] $\forall 1\leq q \leq Q_1, \pi_q > 0$
|
||||||
|
and the coordinates of vector $\bm{\rho}
|
||||||
|
{X^{m^*}}^T$ are distinct (where ${X^{m^*}}^T$ is the transpose of $X^{m^*}$).
|
||||||
|
\item[(1.3)] $\forall 1\leq r \leq Q_2, \rho_r > 0$
|
||||||
|
and the coordinates of vector $\bm{\pi}
|
||||||
|
X^{m^*}$ are distinct.
|
||||||
|
\end{itemize}
|
||||||
|
\end{theorem}
|
||||||
|
\begin{proof}
|
||||||
|
Following the approach of~\cite{chabert-liddellLearningCommonStructures2024a},
|
||||||
|
we derive the result in Properties~\ref{thm:identifiability-iid}.
|
||||||
|
|
||||||
|
\cite{keribinEstimationSelectionLatent2015}, building
|
||||||
|
on~\cite{celisseConsistencyMaximumlikelihoodVariational2012}, proved that the
|
||||||
|
parameters $(\bm{\pi}, \bm{\rho}, \bm{\alpha})$ of the
|
||||||
|
$\mathcal{F}\text{-BiSBM}_{n_1^m,n_2^m}(Q_1^m, Q_2^m, \bm{\pi^m}, \bm{\rho^m}, \bm{\alpha^m})$
|
||||||
|
are identifiable from the observation of network $X^m$ when $\mathcal{F}$
|
||||||
|
is the Bernoulli distribution and the following conditions are met:
|
||||||
|
\begin{enumerate}
|
||||||
|
\item $ n_1^m \geq 2 Q_2^m - 1~\text{and}~n_2^m \geq 2 Q_1^m - 1$.
|
||||||
|
\item $\forall 1\leq q \leq Q_1^m, \pi_q^m > 0$
|
||||||
|
and the coordinates of vector $\bm{\rho^m}
|
||||||
|
{X^{m}}^T$ are distinct (where ${X^{m}}^T$ is the transpose of $X^{m}$).
|
||||||
|
\item $\forall 1\leq r \leq Q_2^m, \rho_r^m > 0$
|
||||||
|
and the coordinates of vector $\bm{\pi^m}
|
||||||
|
X^{m}$ are distinct.
|
||||||
|
\end{enumerate}
|
||||||
|
|
||||||
|
Under the \emph{iid}-colBiSBM model, for all $m=1,\dots,M$,
|
||||||
|
$X^m \sim \mathcal{F}\text{-BiSBM}_{n_1^m,n_2^m}(Q_1, Q_2,
|
||||||
|
\bm{\pi}, \bm{\rho}, \bm{\alpha})$. This means that
|
||||||
|
following~\cite{keribinEstimationSelectionLatent2015}, the
|
||||||
|
identifiability of $\bm{\alpha}$, $\bm{\pi}$ and $\bm{\rho}$ is obtained
|
||||||
|
from the distribution of $X^{m^*}$ under assumptions (1.1), (1.2) and
|
||||||
|
(1.3).
|
||||||
|
\end{proof}
|
||||||
|
|
||||||
\chapter{Supplementary for~\nameref{chap:simulation-studies}}
|
\chapter{Supplementary for~\nameref{chap:simulation-studies}}
|
||||||
Below is the supplementary material for the~\nameref{chap:simulation-studies}.
|
Below is the supplementary material for the~\nameref{chap:simulation-studies}.
|
||||||
|
|
||||||
|
|
@ -31,14 +81,18 @@ Please note that blank space indicates that among all conditions
|
||||||
the corresponding model was not selected at all.
|
the corresponding model was not selected at all.
|
||||||
|
|
||||||
\begin{landscape}
|
\begin{landscape}
|
||||||
\pagestyle{empty}
|
|
||||||
\input{../tables/simulations/model_selection/model-selection.tex}
|
\input{../tables/simulations/model_selection/model-selection.tex}
|
||||||
\end{landscape}
|
\end{landscape}
|
||||||
\pagestyle{fancy}
|
|
||||||
|
|
||||||
|
|
||||||
\chapter{Supplementary for~\nameref{chap:applications-ecological-networks}}
|
\chapter{Supplementary for~\nameref{chap:applications-ecological-networks}}
|
||||||
\section{Additional information on~\nameref{sec:baldock-clustering}}
|
\section{Additional information on~\nameref{sec:baldock-clustering}}
|
||||||
|
|
||||||
|
\fancypagestyle{fancy}
|
||||||
|
|
||||||
|
\renewcommand*{\thepage}{S-\arabic{page}}
|
||||||
|
|
||||||
Due to report size limitations we included these plots here as they are not crucial to understand what is going on in
|
Due to report size limitations we included these plots here as they are not crucial to understand what is going on in
|
||||||
Section~\ref{sec:baldock-clustering}.
|
Section~\ref{sec:baldock-clustering}.
|
||||||
Yet they are useful to confirm the explanation given.
|
Yet they are useful to confirm the explanation given.
|
||||||
|
|
|
||||||
|
|
@ -1,5 +1,6 @@
|
||||||
\addtocounter{customchapter}{1}
|
\addtocounter{customchapter}{1}
|
||||||
\chapter[Structure detection in bipartite collection]{Structure detection in a collection of bipartite networks}
|
\chapter[Structure detection in bipartite collection]{Structure detection in a collection of bipartite networks}
|
||||||
|
\label{chap:struct-detection}
|
||||||
\section{Definition of a collection}
|
\section{Definition of a collection}
|
||||||
\label{sec:definition-of-a-collection}
|
\label{sec:definition-of-a-collection}
|
||||||
|
|
||||||
|
|
@ -708,7 +709,7 @@ And the pairwise dissimilarity for networks $(m,m')\in\mathcal{M}^2$ is then:
|
||||||
|
|
||||||
\begin{figure}[t]
|
\begin{figure}[t]
|
||||||
\centering
|
\centering
|
||||||
\begin{tikzpicture}
|
\begin{tikzpicture}[scale=0.7]
|
||||||
\tikzstyle{instruct}=[font=\small, text justified, rectangle,draw,fill=yellow!50]
|
\tikzstyle{instruct}=[font=\small, text justified, rectangle,draw,fill=yellow!50]
|
||||||
\tikzstyle{first_col}=[rectangle, text justified, draw,fill=gray!50]
|
\tikzstyle{first_col}=[rectangle, text justified, draw,fill=gray!50]
|
||||||
\tikzstyle{second_col}=[scale=0.55, circle, draw,fill=red!50]
|
\tikzstyle{second_col}=[scale=0.55, circle, draw,fill=red!50]
|
||||||
|
|
@ -751,12 +752,10 @@ trivial partition in a unique group.
|
||||||
Then using the \emph{Kmeans} we split the collection in two sub-collections
|
Then using the \emph{Kmeans} we split the collection in two sub-collections
|
||||||
with the dissimilarity matrix. The two sub-collections are fitted and we
|
with the dissimilarity matrix. The two sub-collections are fitted and we
|
||||||
compute the score of this new partition $\mathcal{G}^{*} = \{G_1, G_2\}$.
|
compute the score of this new partition $\mathcal{G}^{*} = \{G_1, G_2\}$.
|
||||||
|
|
||||||
If $Sc(\mathcal{G}^{*}) > Sc(\mathcal{G})$ then we repeat the same procedure on
|
If $Sc(\mathcal{G}^{*}) > Sc(\mathcal{G})$ then we repeat the same procedure on
|
||||||
$G_1$ and $G_2$. Else we return $\mathcal{G}$.
|
$G_1$ and $G_2$. Else we return $\mathcal{G}$.
|
||||||
|
|
||||||
We illustrate our capacity to perform a partition of a collection for all
|
We illustrate our capacity to perform a partition of a collection for all
|
||||||
colBiSBM models in %\ref{sec:network-clustering-of-simulated-networks}.
|
colBiSBM models in Section~\ref{sec:network-clustering-of-simulated-networks}.
|
||||||
|
|
||||||
\section{Model identifiability}
|
\section{Model identifiability}
|
||||||
\label{sec:model-identifiability}
|
\label{sec:model-identifiability}
|
||||||
|
|
@ -764,7 +763,7 @@ colBiSBM models in %\ref{sec:network-clustering-of-simulated-networks}.
|
||||||
The goal here is to prove that if $\ell(\bm{X};\bm{\theta}) = \ell(\bm{X};\bm{\theta}')$ for any collection $\bm{X}$ then $\bm{\theta} = \bm{\theta}'$.
|
The goal here is to prove that if $\ell(\bm{X};\bm{\theta}) = \ell(\bm{X};\bm{\theta}')$ for any collection $\bm{X}$ then $\bm{\theta} = \bm{\theta}'$.
|
||||||
|
|
||||||
Following the proof proposed by~\cite{chabert-liddellLearningCommonStructures2024a}, who adapted it to the collection case, and by~\cite{keribinEstimationSelectionLatent2015}, who extended the result of~\cite{celisseConsistencyMaximumlikelihoodVariational2012} to the LBM Bernoulli model,
|
Following the proof proposed by~\cite{chabert-liddellLearningCommonStructures2024a}, who adapted it to the collection case, and by~\cite{keribinEstimationSelectionLatent2015}, who extended the result of~\cite{celisseConsistencyMaximumlikelihoodVariational2012} to the LBM Bernoulli model,
|
||||||
we obtain the following proof of identifiability for the $iid$-colBiSBM:
|
we obtain the following identifiability result\footnote{The proof is given in Appendix~\ref{sec:proof-identifiability}.} for the $iid$-colBiSBM:
|
||||||
\begin{theorem}[Identifiability of $iid$-colBiSBM]
|
\begin{theorem}[Identifiability of $iid$-colBiSBM]
|
||||||
\label{thm:identifiability-iid}
|
\label{thm:identifiability-iid}
|
||||||
The parameters $(\bm{\pi}, \bm{\rho}, \bm{\alpha})$ are
|
The parameters $(\bm{\pi}, \bm{\rho}, \bm{\alpha})$ are
|
||||||
|
|
|
||||||
Binary file not shown.
|
|
@ -26,7 +26,7 @@
|
||||||
hypertexnames=true
|
hypertexnames=true
|
||||||
}
|
}
|
||||||
|
|
||||||
\newtheorem{theorem}{Theorem}
|
\newtheorem{theorem}{Properties}
|
||||||
\usepackage{tocbibind} % Pour avoir des index pour table des matières, biblio
|
\usepackage{tocbibind} % Pour avoir des index pour table des matières, biblio
|
||||||
\usepackage{geometry}
|
\usepackage{geometry}
|
||||||
\geometry{bmargin=25mm}
|
\geometry{bmargin=25mm}
|
||||||
|
|
|
||||||
Loading…
Add table
Reference in a new issue