submitted version

This commit is contained in:
Pierre-Francois Loos 2020-01-02 12:39:15 +01:00
parent 551d7d9f74
commit 5d65e110c6
5 changed files with 1349 additions and 759 deletions

1791
JPCL.nb

File diff suppressed because it is too large Load Diff

View File

@ -1,7 +1,7 @@
%% This BibTeX bibliography file was created using BibDesk.
%% http://bibdesk.sourceforge.net/
%% Created for Pierre-Francois Loos at 2019-11-19 20:03:52 +0100
%% Created for Pierre-Francois Loos at 2020-01-02 11:03:42 +0100
%% Saved with string encoding Unicode (UTF-8)
@ -82,6 +82,39 @@
@string{theo = {J. Mol. Struct. (THEOCHEM)}}
@article{Hod19b,
Author = {Manuel Hodecker and Dirk R. Rehn and Patrick Norman and Andreas Dreuw},
Date-Added = {2020-01-02 11:03:38 +0100},
Date-Modified = {2020-01-02 11:03:38 +0100},
Doi = {10.1063/1.5081665},
Journal = {J. Chem. Phys.},
Pages = {174105},
Title = {Algebraic-Diagrammatic Construction Scheme for the Polarization Propagator Including Ground-State Coupled-Cluster Amplitudes. II. Static Polarizabilities},
Volume = {150},
Year = {2019},
Bdsk-Url-1 = {https://doi.org/10.1063/1.5081663}}
@article{Hod19a,
Author = {Manuel Hodecker and Adrian L. Dempwolff and Dirk R. Rehn and Andreas Dreuw},
Date-Added = {2020-01-02 11:03:35 +0100},
Date-Modified = {2020-01-02 11:03:35 +0100},
Doi = {10.1063/1.5081663},
Journal = {J. Chem. Phys.},
Pages = {174104},
Title = {Algebraic-diagrammatic construction scheme for the polarization propagator including ground-state coupled-cluster amplitudes. I. Excitation energies},
Volume = {150},
Year = {2019},
Bdsk-Url-1 = {https://doi.org/10.1063/1.5081663}}
@article{Loo20a,
Author = {P. F. Loos and D. Jacquemin},
Date-Added = {2020-01-02 11:01:16 +0100},
Date-Modified = {2020-01-02 11:01:48 +0100},
Journal = {J. Phys. Chem. Lett.},
Title = {Is ADC(3) as Accurate as CC3 for Valence and Rydberg Transition Energies?},
Volume = {in press},
Year = {2020}}
@article{Odd78,
Author = {J. Oddershede},
Date-Added = {2019-11-19 19:58:44 +0100},
@ -725,7 +758,7 @@
Doi = {10.1080/00268976.2015.1119901},
Journal = {Mol. Phys.},
Pages = {957--967},
Title = {Assessment Of The Convergence Of Partially Self-Consistent {{BSE/GW}} Calculations},
Title = {Assessment of the Convergence of Partially Self-Consistent {{BSE/GW}} Calculations},
Volume = {114},
Year = {2016},
Bdsk-Url-1 = {https://doi.org/10.1080/00268976.2015.1119901}}
@ -1260,7 +1293,7 @@
Doi = {10.1063/1.1676398},
Journal = {J. Chem. Phys.},
Pages = {2236},
Title = {SelfConsistent Molecular Orbital Methods. X. Molecular Orbital Studies of Excited States with Minimal and Extended Basis Sets},
Title = {Self-Consistent Molecular Orbital Methods. X. Molecular Orbital Studies of Excited States with Minimal and Extended Basis Sets},
Volume = {55},
Year = {1971},
Bdsk-Url-1 = {https://doi.org/10.1063/1.1676398}}
@ -1600,7 +1633,7 @@
Month = jun,
Number = {23},
Pages = {10252--10264},
Title = {Introduction of {\emph{n}} -Electron Valence States for Multireference Perturbation Theory},
Title = {Introduction of {\emph{N}}-Electron Valence States for Multireference Perturbation Theory},
Volume = {114},
Year = {2001},
Bdsk-Url-1 = {https://doi.org/10.1063/1.1361246}}

View File

@ -1,27 +1,47 @@
\documentclass[aip,jcp,reprint,noshowkeys,superscriptaddress]{revtex4-1}
\usepackage{graphicx,dcolumn,bm,xcolor,microtype,multirow,amscd,amsmath,amssymb,amsfonts,physics,mhchem,longtable,pifont,wrapfig,multirow}
\newif\ifpreprint
%Preprint/reprint switch
%\preprinttrue % Enable for single column preprint
\preprintfalse % Enable for double column reprint
\usepackage[T1]{fontenc}
\ifpreprint
\documentclass[journal=jpclcd,manuscript=letter]{achemso}
\else
\documentclass[journal=jpclcd,manuscript=letter,layout=twocolumn]{achemso}
\fi
\usepackage[T1]{fontenc} % Use modern font encodings
\usepackage{amsmath}
\usepackage{newtxtext,newtxmath}
\usepackage{natbib}
\bibliographystyle{achemso}
\usepackage[
colorlinks=true,
citecolor=blue,
breaklinks=true
]{hyperref}
\urlstyle{same}
\usepackage{pifont}
\usepackage{graphicx}
\usepackage{dcolumn}
\usepackage{braket}
\usepackage{multirow}
\usepackage{threeparttable}
\usepackage{xspace}
\usepackage{verbatim}
\usepackage[version=4]{mhchem} % Formula subscripts using \ce{}
\usepackage{comment}
\usepackage{color,soul}
\newcommand{\alert}[1]{\textcolor{red}{#1}}
\usepackage[normalem]{ulem}
\newcommand{\titou}[1]{\textcolor{red}{#1}}
\newcommand{\denis}[1]{\textcolor{purple}{#1}}
\newcommand{\toto}[1]{\textcolor{brown}{#1}}
\newcommand{\trashPFL}[1]{\textcolor{red}{\sout{#1}}}
\newcommand{\trashDJ}[1]{\textcolor{purple}{\sout{#1}}}
\newcommand{\trashAS}[1]{\textcolor{brown}{\sout{#1}}}
\usepackage{mathtools}
\usepackage[dvipsnames]{xcolor}
\usepackage{xspace}
\usepackage{ifthen}
\usepackage{qcircuit}
\usepackage{graphicx,longtable,dcolumn,mhchem}
\usepackage{rotating,color}
\usepackage{lscape}
\usepackage{amsmath}
\usepackage{dsfont}
\usepackage{soul}
\usepackage{physics}
\newcommand{\cmark}{\color{green}{\text{\ding{51}}}}
\newcommand{\xmark}{\color{red}{\text{\ding{55}}}}
@ -48,44 +68,128 @@
\newcommand{\SetB}{QUEST\#2}
\newcommand{\SetC}{QUEST\#3}
\usepackage[colorlinks = true,
linkcolor = blue,
urlcolor = black,
citecolor = blue,
anchorcolor = black]{hyperref}
\definecolor{goodorange}{RGB}{225,125,0}
\definecolor{goodgreen}{RGB}{5,130,5}
\definecolor{goodred}{RGB}{220,50,25}
\definecolor{goodblue}{RGB}{30,144,255}
\newcommand{\note}[2]{
\ifthenelse{\equal{#1}{F}}{
\colorbox{goodorange}{\textcolor{white}{\footnotesize \fontfamily{phv}\selectfont #1}}
\textcolor{goodorange}{{\footnotesize \fontfamily{phv}\selectfont #2}}\xspace
}{}
\ifthenelse{\equal{#1}{R}}{
\colorbox{goodred}{\textcolor{white}{\footnotesize \fontfamily{phv}\selectfont #1}}
\textcolor{goodred}{{\footnotesize \fontfamily{phv}\selectfont #2}}\xspace
}{}
\ifthenelse{\equal{#1}{N}}{
\colorbox{goodgreen}{\textcolor{white}{\footnotesize \fontfamily{phv}\selectfont #1}}
\textcolor{goodgreen}{{\footnotesize \fontfamily{phv}\selectfont #2}}\xspace
}{}
\ifthenelse{\equal{#1}{M}}{
\colorbox{goodblue}{\textcolor{white}{\footnotesize \fontfamily{phv}\selectfont #1}}
\textcolor{goodblue}{{\footnotesize \fontfamily{phv}\selectfont #2}}\xspace
}{}
}
\usepackage{titlesec}
%\usepackage{footnote}
%
\let\titlefont\undefined
\usepackage[fontsize=11pt]{scrextend}
\captionsetup{font={sf,footnotesize}}
%
\titleformat{\section}
{\normalfont\sffamily\bfseries\color{Blue}}
{\thesection.}{0.25em}{\uppercase}
\titleformat{\subsection}[runin]
{\normalfont\sffamily\bfseries}
{\thesubsection}{0.25em}{}[.\;\;]
\titleformat{\suppinfo}
{\normalfont\sffamily\bfseries}
{\thesubsection}{0.25em}{}
\titlespacing*{\section}{0pt}{0.5\baselineskip}{0.01\baselineskip}
\titlespacing*{\subsection}{0pt}{0.125\baselineskip}{0.01\baselineskip}
\renewcommand{\refname}{\normalfont\sffamily\bfseries\color{Blue}{\normalsize REFERENCES}}
\setlength{\bibsep}{0pt plus 0.3ex}
\author{Pierre-Fran\c{c}ois Loos}
\email{loos@irsamc.ups-tlse.fr}
\affiliation[LCPQ, Toulouse]{Laboratoire de Chimie et Physique Quantiques, Universit\'e de Toulouse, CNRS, UPS, France}
\author{Anthony Scemama}
\affiliation[LCPQ, Toulouse]{Laboratoire de Chimie et Physique Quantiques, Universit\'e de Toulouse, CNRS, UPS, France}
\author{Denis Jacquemin}
\email{Denis.Jacquemin@univ-nantes.fr}
\affiliation[CEISAM, Nantes]{Universit\'e de Nantes, CNRS, CEISAM UMR 6230, F-44000 Nantes, France}
\let\oldmaketitle\maketitle
\let\maketitle\relax
\title{The Quest For Highly Accurate Excitation Energies: A Computational Perspective}
\date{\today}
\begin{tocentry}
\vspace{1cm}
\includegraphics[width=\textwidth]{TOC}
\end{tocentry}
\newcommand{\LCPQ}{Laboratoire de Chimie et Physique Quantiques, Universit\'e de Toulouse, CNRS, UPS, France}
\newcommand{\CEISAM}{Laboratoire CEISAM - UMR CNRS 6230, Universit\'e de Nantes, 2 Rue de la Houssini\`ere, BP 92208, 44322 Nantes Cedex 3, France}
\begin{document}
\title{The Quest For Highly Accurate Excitation Energies: A Computational Perspective}
\ifpreprint
\else
\twocolumn[
\begin{@twocolumnfalse}
\fi
\oldmaketitle
\author{Pierre-Fran\c{c}ois \surname{Loos}}
\email{loos@irsamc.ups-tlse.fr}
\affiliation{\LCPQ}
\author{Anthony \surname{Scemama}}
\affiliation{\LCPQ}
\author{Denis \surname{Jacquemin}}
\email[Corresponding author: ]{Denis.Jacquemin@univ-nantes.fr}
\affiliation{\CEISAM}
%%%%%%%%%%%%%%%%
%%% ABSTRACT %%%
%%%%%%%%%%%%%%%%
\begin{abstract}
\begin{wrapfigure}[15]{o}[-1.25cm]{0.4\linewidth}
\centering
\includegraphics[width=\linewidth]{TOC}
\end{wrapfigure}
We provide a personal overview of the successive steps that made possible to obtain increasingly accurate excitation energies and properties with computational chemistry tools, eventually leading to chemically accurate vertical transition energies for small- and
medium-size molecules. First, we describe the evolution of \textit{ab initio} state-of-the-art methods employed to define benchmark values, with originally Roos' CASPT2 method, and then third-order coupled cluster methods as in the renowned Thiel set of excitation
energies described in a remarkable series of papers in the 2000's. More recently, this quest for highly accurate excitation energies was reinitiated thanks to the resurgence of selected configuration interaction (SCI) methods and their efficient parallel implementation.
These methods have been able to routinely deliver highly accurate excitation energies for small molecules, as well as medium-size molecules with compact basis sets, for both single and double excitations. Second, we describe how these high-level methods
and the creation of large, diverse, and accurate benchmark sets of excitation energies have allowed to assess fairly and accurately the performance of computationally lighter theoretical models (\eg, TD-DFT, BSE, ADC, EOM-CC, etc.) for different types of
excited states ($\pi \ra \pi^*$, $n \ra \pi^*$, valence, Rydberg, singlet, triplet, double excitation, etc). We conclude this \textit{Perspective} by discussing the current potentiality of these methods from both an expert and a non-expert points of view, and what we
We provide an overview of the successive steps that made possible to obtain increasingly accurate excitation energies and properties with computational chemistry tools, eventually leading to chemically accurate vertical transition
energies for small- and medium-size molecules. First, we describe the evolution of \textit{ab initio} state-of-the-art methods employed to define benchmark values, with originally Roos' CASPT2 method, and then third-order
coupled cluster (CC3) methods as in the renowned Thiel set of vertical excitation energies described in a remarkable series of papers in the 2000's. More recently, this quest for highly accurate excitation energies was reinitiated
thanks to the resurgence of selected configuration interaction (SCI) methods and their efficient parallel implementation. These methods have been able to routinely deliver highly accurate excitation energies for small molecules,
as well as medium-size molecules with compact basis sets, for both single and double excitations. Second, we describe how these high-level methods and the creation of large, diverse, and accurate benchmark sets of excitation
energies have allowed to assess fairly and accurately the performance of computationally lighter theoretical models (\eg, TD-DFT, BSE@\textit{GW}, ADC, EOM-CC, etc.) for different types of excited states ($\pi \rightarrow \pi^*$,
$n \rightarrow \pi^*$, valence, Rydberg, singlet, triplet, double excitation, etc). We conclude this \textit{Perspective} by discussing the current potentiality of these methods from both an expert and a non-expert points of view, and what we
believe could be the future theoretical and technological developments in the field.
\end{abstract}
\maketitle
\ifpreprint
\else
\end{@twocolumnfalse}
]
\fi
\ifpreprint
\else
\small
\fi
\noindent
%%%%%%%%%%%%%%%%%%%%
%%% INTRODUCTION %%%
%%%%%%%%%%%%%%%%%%%%
The accurate modeling of excited-state properties with \textit{ab initio} quantum chemistry methods is a challenging yet self-proclaimed ambition of the electronic structure theory community that will certainly keep us busy for (at the very least) the next few decades to come
(see, for example, Refs.~\onlinecite{Dre05,Gon12,Gho18} and references therein). Of particular interest is the access to precise excitation energies, \ie, the energy difference between ground and excited electronic states, and their intimate link with photophysical and
(see, for example, Refs.~\citenum{Dre05,Gon12,Gho18} and references therein). Of particular interest is the access to precise excitation energies, \ie, the energy difference between ground and excited electronic states, and their intimate link with photophysical and
photochemical processes. The factors that makes this quest for high accuracy particularly delicate are very diverse.
First of all (and maybe surprisingly), it is, in most cases, tricky to obtain reliable and accurate experimental data that one can straightforwardly compare to theoretical values. In the case of vertical excitation energies, \ie, excitation energies at a fixed geometry, band maxima
@ -93,7 +197,7 @@ do not usually correspond to theoretical values as one needs to take into accoun
assignment could be made. For a more faithful comparison between theory and experiment, although more computationally demanding, the so-called 0-0 energies are definitely a safer playground. \cite{Die04b,Win13,Fan14b,Loo19b}
Second, developing theories suited for excited states is usually more complex and costly than their ground-state equivalent, as one might lack a proper variational principle for excited-state energies.
As a consequence, for a given level of theory, excited-state methods are usually less accurate than their ground-state counterpart.
As a consequence, for a given level of theory, excited-state methods are usually less accurate than their ground-state counterpart, potentially creating a ground-state bias that leads to inaccurate excitation energies.
Another feature that makes excited states particularly fascinating and challenging is that they can be both extremely close in energy from each other and have very different natures ($\pi \ra \pi^*$, $n \ra \pi^*$, charge transfer, double excitation, valence, Rydberg, singlet,
triplet, etc). Therefore, it would be highly desirable to possess a computational method (or protocol) that provides a balanced treatment of the entire ``spectrum'' of excited states.
@ -105,18 +209,18 @@ Let us not forget about the requirements of minimal user input and minimal chemi
respect to system size and small memory footprint cannot be disregarded. Although the simultaneous fulfillment of all these requirements seems elusive, it is useful to keep these criteria in mind. Table \ref{tab:method} is here for fulfill such a purpose.
%%% TABLE I %%%
%\begin{squeezetable}
\begin{table}
\footnotesize
\caption{Formal computational scaling of various excited-state methods with respect to the number of one-electron basis functions $N$ and the accessibility of various key properties in popular computational software packages.
The typical error range of estimate for single excitations is also provided as a very rough indicator of the method accuracy.}
The typical error range for single excitations is also provided as a qualitative indicator of the method accuracy.}
\label{tab:method}
\begin{ruledtabular}
\begin{tabular}{lcccc}
\begin{tabular}{p{2.1cm}cccc}
\hline
\mr{2}{*}{Method} & Formal & Oscillator & Analytical & Typical \\
& scaling & strength & gradients & error (eV) \\
\hline
TD-DFT & $N^4$ & \cmark & \cmark & $0.2$--$0.4$ \\
BSE@\emph{GW} & $N^4$ & \cmark & \xmark & $0.1$--$0.3$ \\
BSE@\textit{GW} & $N^4$ & \cmark & \xmark & $0.1$--$0.3$ \\
\\
CIS & $N^5$ & \cmark & \cmark & $\sim 1.0$ \\
CIS(D) & $N^5$ & \xmark & \cmark & $0.2$--$0.3$ \\
@ -131,19 +235,18 @@ The typical error range of estimate for single excitations is also provided as a
EOM-CCSDT & $N^8$ & \xmark & \xmark & $\sim 0.03$ \\
EOM-CCSDTQ & $N^{10}$ & \xmark & \xmark & $\sim 0.01$ \\
\\
CASPT2 or NEVPT2 & $N!$ & \cmark & \cmark & $0.1$--$0.2$ \\
CASPT2/NEVPT2 & $N!$ & \cmark & \cmark & $0.1$--$0.2$ \\
SCI & $N!$ & \xmark & \xmark & $\sim 0.03$ \\
FCI & $N!$ & \cmark & \cmark & $0.0$ \\
\hline
\end{tabular}
\end{ruledtabular}
\end{table}
%\end{squeezetable}
%**************
%** HISTORY **%
%**************
Before detailing some key past and present contributions aiming at obtaining highly accurate excitation energies, we start by giving a historical overview of the various excited-state \textit{ab initio} methods that have emerged in the last fifty years.
Interestingly, for pretty much every single method, the theory was derived much earlier than their actual implementation in electronic structure software packages and the same applies to the analytical gradients when they are available.
Interestingly, for pretty much every single method, the theory was derived much earlier than their actual implementation in electronic structure software packages and the same applies to the analytical gradients when available.
%%%%%%%%%%%%%%%%%%%%%
%%% POPLE'S GROUP %%%
@ -160,12 +263,12 @@ This second-order correction greatly reduces the magnitude of the error compared
In the early 1990's, the complete-active-space self-consistent field (CASSCF) method \cite{And90} and its second-order perturbation-corrected variant CASPT2 \cite{And92} (both originally developed in Roos' group) appeared.
This was a real breakthrough.
Although it took more than ten years to obtain analytical gradients, \cite{Cel03} CASPT2 was probably the first method that could provide quantitative results for molecular excited states of genuine photochemical interest. \cite{Roo96}
Nonetheless, it is common knowledge that CASPT2 has the clear tendency of underestimating vertical excitation energies in organic molecules.
Nonetheless, it is of common knowledge that CASPT2 has the clear tendency of underestimating vertical excitation energies in organic molecules.
Driven by Angeli and Malrieu, \cite{Ang01} the creation of the second-order $n$-electron valence state perturbation theory (NEVPT2) method several years later was able to cure some of the main theoretical deficiencies of CASPT2.
For example, NEVPT2 is known to be intruder state free and size consistent.
The limited applicability of these multiconfigurational methods is mainly due to the need of carefully defining an active space based on the desired transition(s) in order to obtain meaningful results, as well as their factorial computational growth with the number of active electrons and orbitals.
We also point out that some emergent approaches, like DMRG (density matrix renormalization group), \cite{Bai19} also offer a new path for the development of these multiconfigurational theories.
With a typical minimal valence active space tailored for the desired transitions, the usual error with CASPT2 or NEVPT2 calculations is $0.1$--$0.2$ eV.
We also point out that some emergent approaches, like DMRG (density matrix renormalization group), \cite{Bai19} offer a new path for the development of these multiconfigurational methods.
%%%%%%%%%%%%%
%%% TDDFT %%%
@ -199,23 +302,23 @@ It is also noteworthy that CCSDT and CC3 are also able to detect the presence of
%%%%%%%%%%%%%%%%%%%
It is also important to mention the recent rejuvenation of the second- and third-order algebraic diagrammatic construction [ADC(2) \cite{Sch82} and ADC(3) \cite{Tro99,Har14}] methods that scale as $N^5$ and $N^6$, respectively.
These methods are related to the older second- and third-order polarization propagator approaches (SOPPA and TOPPA). \cite{Odd78,Pac96}
This renaissance was certainly initiated by the enormous amount of work invested by Dreuw's group in order to provide a fast and efficient implementation of these methods, \cite{Dre15} including the analytical gradients, \cite{Reh19} as well as other interesting variants.
This renaissance was certainly initiated by the enormous amount of work invested by Dreuw's group in order to provide a fast and efficient implementation of these methods, \cite{Dre15} including the analytical gradients, \cite{Reh19} as well as other interesting variants. \cite{Dre15,Hod19a}
These Green's function one-electron propagator techniques indeed represent valuable alternatives thanks to their reduced cost compared to their CC equivalents.
In that regard, ADC(2) is particularly attractive with an error around $0.1$--$0.2$ eV.
However, we have recently observed that ADC(3) generally overcorrects the ADC(2) excitation energies and is significantly less accurate than CC3. \cite{Tro02,Loo18a,Loo20}
However, we have recently observed that ADC(3) generally overcorrects the ADC(2) excitation energies and is significantly less accurate than CC3. \cite{Tro02,Loo18a,Loo20,Loo20a}
%%%%%%%%%%%%%%
%%% BSE@GW %%%
%%%%%%%%%%%%%%
Finally, let us mention the many-body Green's function Bethe-Salpeter equation (BSE) formalism \cite{Str88} (which is usually performed on top of a \emph{GW} calculation). \cite{Hed65}
Finally, let us mention the many-body Green's function Bethe-Salpeter equation (BSE) formalism \cite{Str88} (which is usually performed on top of a \textit{GW} calculation). \cite{Hed65}
BSE has gained momentum in the past few years and is a serious candidate as a computationally inexpensive electronic structure theory method that can effectively model excited states with a typical error of $0.1$--$0.3$ eV, as well as some related properties. \cite{Jac17b,Bla18}
One of the main advantage of BSE compared to TD-DFT (with a similar computational cost) is that it allows a faithful description of charge-transfer states and, when performed on top of a (partially) self-consistently \emph{GW} calculation, BSE@\emph{GW} has been shown to be weakly dependent on its starting point (\ie, on the functional selected for the underlying DFT calculation). \cite{Jac16,Gui18}
One of the main advantage of BSE compared to TD-DFT (with a similar computational cost) is that it allows a faithful description of charge-transfer states and, when performed on top of a (partially) self-consistently \textit{GW} calculation, BSE@\textit{GW} has been shown to be weakly dependent on its starting point (\ie, on the functional selected for the underlying DFT calculation). \cite{Jac16,Gui18}
However, due to the adiabatic (\ie, static) approximation, doubly excited states are completely absent from the BSE spectrum.
%%%%%%%%%%%%%%%%%%%
%%% SCI METHODS %%%
%%%%%%%%%%%%%%%%%%%
In the past five years, \cite{Gin13,Gin15} we have witnessed a resurgence of the so-called selected CI (SCI) methods \cite{Ben69,Whi69,Hur73} thanks to the development and implementation of new, fast, and efficient algorithms to select cleverly determinants in the full CI (FCI) space (see Refs.~\onlinecite{Gar18,Gar19} and references therein).
In the past five years, \cite{Gin13,Gin15} we have witnessed a resurgence of the so-called selected CI (SCI) methods \cite{Ben69,Whi69,Hur73} thanks to the development and implementation of new, fast, and efficient algorithms to select cleverly determinants in the full CI (FCI) space (see Refs.~\citenum{Gar18,Gar19} and references therein).
SCI methods rely on the same principle as the usual CI approach, except that determinants are not chosen \textit{a priori} based on occupation or excitation criteria but selected among the entire set of determinants based on their estimated contribution to the FCI wave function or energy.
Indeed, it has been noticed long ago that, even inside a predefined subspace of determinants, only a small number of them significantly contributes.
The main advantage of SCI methods is that no \textit{a priori} assumption is made on the type of electron correlation.
@ -231,7 +334,7 @@ For someone who has never worked with SCI methods, it might be surprising to see
This is mainly due to some specific choices in terms of implementation as explained below.
Indeed, to keep up with Moore's ``Law'' in the early 2000's, the processor designers had no other choice than to propose multi-core chips to avoid an explosion of the energy requirements.
Increasing the number of floating-point operations per second by doubling the number of CPU cores only requires to double the required energy, while doubling the frequency multiplies the required energy by a factor of $\sim$ 8.
This bifurcation in hardware design implied a \emph{change of paradigm} \cite{Sut05} in the implementation and design of computational algorithms. A large degree of parallelism is now required to benefit from a significant acceleration.
This bifurcation in hardware design implied a \textit{change of paradigm} \cite{Sut05} in the implementation and design of computational algorithms. A large degree of parallelism is now required to benefit from a significant acceleration.
Fifteen years later, the community has made a significant effort to redesign the methods with parallel-friendly algorithms. \cite{Val10,Cle10,Gar17b,Pen16,Kri13,Sce13}
In particular, the change of paradigm to reach FCI accuracy with SCI methods came
from the use of determinant-driven algorithms which were considered for long as inefficient
@ -252,7 +355,7 @@ In summary, each method has its own strengths and weaknesses, and none of them i
%%% FIG 1 %%%
\begin{figure*}
\includegraphics[width=\linewidth]{Set1}
\caption{Mean absolute error (in eV) with respect to the TBE/\emph{aug}-cc-pVTZ values from the {\SetA} set (as described in Ref.~\onlinecite{Loo18a}) for various methods and types of excited states.
\caption{Mean absolute error (in eV) with respect to the TBE/\textit{aug}-cc-pVTZ values from the {\SetA} set (as described in Ref.~\citenum{Loo18a}) for various methods and types of excited states.
}
\label{fig:Set1}
\end{figure*}
@ -261,7 +364,7 @@ In summary, each method has its own strengths and weaknesses, and none of them i
%%% FIG 2 %%%
\begin{figure}
\includegraphics[width=\linewidth]{Set2}
\caption{Mean absolute error (in eV) (with respect to FCI excitation energies) for the doubly excited states reported in Ref.~\onlinecite{Loo19c} for various methods taking into account at least triple excitations.
\caption{Mean absolute error (in eV) (with respect to FCI excitation energies) for the doubly excited states reported in Ref.~\citenum{Loo19c} for various methods taking into account at least triple excitations.
$\%T_1$ corresponds to single excitation percentage in the transition calculated at the CC3 level.}
\label{fig:Set2}
\end{figure}
@ -270,7 +373,7 @@ In summary, each method has its own strengths and weaknesses, and none of them i
%%% FIG 3 %%%
\begin{figure*}
\includegraphics[width=\linewidth]{Set3}
\caption{Mean absolute error (in eV) with respect to the TBE/\emph{aug}-cc-pVTZ values from the {\SetC} set (as described in Ref.~\onlinecite{Loo20}) for various methods and types of excited states.}
\caption{Mean absolute error (in eV) with respect to the TBE/\textit{aug}-cc-pVTZ values from the {\SetC} set (as described in Ref.~\citenum{Loo20}) for various methods and types of excited states.}
\label{fig:Set3}
\end{figure*}
%%% %%% %%%
@ -285,20 +388,19 @@ For excited states, things started moving a little later but some major contribu
%%%%%%%%%%%%%%%%%%%
%%% THIEL'S SET %%%
%%%%%%%%%%%%%%%%%%%
One of these major contributions was provided by the group of Walter Thiel \cite{Sch08,Sil08,Sau09,Sil10b,Sil10c} with the introduction of the so-called Thiel (Mulheim) set of excitation energies. \cite{Sch08}
One of these major contributions was provided by the group of Walter Thiel \cite{Sch08,Sil08,Sau09,Sil10b,Sil10c} with the introduction of the so-called Thiel set of excitation energies. \cite{Sch08}
For the first time, this set was large, diverse, consistent, and accurate enough to be used as a proper benchmarking set for excited-state methods.
More specifically, it gathers a large number of excitation energies consisting of 28 medium-size organic molecules with a total of 223 valence excited states (152 singlet and 71 triplet states) for which theoretical best estimates (TBEs) were defined.
In their first study Thiel and collaborators performed CC2, CCSD, CC3 and CASPT2 calculations (with the TZVP basis) in order to provide (based on additional high-level literature data) TBEs for these transitions.
In their first study Thiel and collaborators performed CC2, CCSD, CC3 and CASPT2 calculations (with the TZVP basis) in order to provide (based on additional high-quality literature data) TBEs for these transitions.
Their main conclusion was that \textit{``CC3 and CASPT2 excitation energies are in excellent agreement for states which are dominated by single excitations''}.
These TBEs were quickly refined with the larger \emph{aug}-cc-pVTZ basis set, \cite{Sil10b} highlighting the importance of diffuse functions.
As a direct evidence of the actual value of reference data, these TBEs were quickly picked up to benchmark various computationally effective methods from semi-empirical to state-of-the-art \textit{ab initio} methods (see the Introduction of Ref.~\onlinecite{Loo18a} and references therein).
These TBEs were quickly refined with the larger \textit{aug}-cc-pVTZ basis set, \cite{Sil10b} highlighting the importance of diffuse functions.
As a direct evidence of the actual value of reference data, these TBEs were quickly picked up to benchmark various computationally effective methods from semi-empirical to state-of-the-art \textit{ab initio} methods (see the \textit{Introduction} of Ref.~\citenum{Loo18a} and references therein).
Theoretical improvements of Thiel's set were slow but steady, highlighting further its quality.
Theoretical improvements of Thiel's set were slow but steady, highlighting further its quality. \cite{Wat13,Kan14,Har14,Kan17}
In 2013, Watson \textit{et al.} \cite{Wat13} computed CCSDT-3/TZVP (an iterative approximation of the triples of CCSDT \cite{Wat96}) excitation energies for the Thiel set.
Their quality were very similar to the CC3 values reported in Ref.~\onlinecite{Sau09} and the authors could not appreciate which model was the most accurate.
Their quality were very similar to the CC3 values reported in Ref.~\citenum{Sau09} and the authors could not appreciate which model was the most accurate.
Similarly, Dreuw and coworkers performed ADC(3) calculations on Thiel's set and arrived at the same kind of conclusion: \cite{Har14}
\textit{``based on the quality of the existing benchmark set it is practically not possible to judge whether ADC(3) or CC3 is more accurate''}.
%Finally, let us mention the work of Kannar and Szalay who reported CCSDT excitation energies \cite{Kan14,Kan17} for a subset of the original Thiel set.
These two studies clearly demonstrate and motivate the need for higher accuracy benchmark excited-states energies.
%%%%%%%%%%%%%%%%%%%%%%%
@ -306,32 +408,32 @@ These two studies clearly demonstrate and motivate the need for higher accuracy
%%%%%%%%%%%%%%%%%%%%%%%
Recently, we made, what we think, is a significant contribution to this quest for highly accurate vertical excitation energies. \cite{Loo18a}
More specifically, we studied 18 small molecules with sizes ranging from one to three non-hydrogen atoms.
For such systems, using a combination of high-order CC methods, SCI calculations and large diffuse basis sets, we were able to compute a list of 110 highly accurate vertical excitation energies for excited states of various natures (valence, Rydberg, $n \ra \pi^*$, $\pi \ra \pi^*$, singlet, triplet and doubly excited) based on CC3/\emph{aug}-cc-pVTZ geometries.
For such systems, using a combination of high-order CC methods, SCI calculations and large diffuse basis sets, we were able to compute a list of 110 highly accurate vertical excitation energies for excited states of various natures (valence, Rydberg, $n \ra \pi^*$, $\pi \ra \pi^*$, singlet, triplet and doubly excited) based on CC3/\textit{aug}-cc-pVTZ geometries.
In the following, we label this set of TBEs as {\SetA}.
Importantly, it allowed us to benchmark a series of popular excited-state wave function methods partially or fully accounting for double and triple excitations (see Fig.~\ref{fig:Set1}): CIS(D), CC2, CCSD, STEOM-CCSD, \cite{Noo97} CCSDR(3), \cite{Chr77} CCSDT-3, \cite{Wat96} CC3, ADC(2), and ADC(3).
Our main conclusion was that CC3 is extremely accurate (with a mean absolute error of only $\sim 0.03$ eV), and that, although slightly less accurate than CC3, CCSDT-3 could be used as a reliable reference for benchmark studies.
Quite surprisingly, ADC(3) was found to have a clear tendency to overcorrect its second-order version ADC(2).
The mean absolute errors (MAEs) obtained for this set can be found in Fig.~\ref{fig:Set1}.
In a second study, \cite{Loo19c} using a similar combination of theoretical models (but mostly extrapolated SCI energies), we provided accurate reference excitation energies for transitions involving a substantial amount of double excitations using a series of increasingly large diffuse-containing atomic basis sets (up to \emph{aug}-cc-pVQZ when technically feasible).
This set gathers 20 vertical transitions from 14 small- and medium-sized molecules, a set we label as {\SetB} in the remaining of this \emph{Perspective}.
An important addition to this second study was the evaluation of various flavors of multiconfigurational methods (CASSCF, CASPT2, and NEVPT2) in addition to high-order CC methods including, at least, perturbative triples (see Fig.~\ref{fig:Set2}).
In a second study, \cite{Loo19c} using a similar combination of theoretical models (but mostly extrapolated SCI energies), we provided accurate reference excitation energies for transitions involving a substantial amount of double excitations using a series of increasingly large diffuse-containing atomic basis sets (up to \textit{aug}-cc-pVQZ when technically feasible).
This set gathers 20 vertical transitions from 14 small- and medium-sized molecules, a set we label as {\SetB} in the remaining of this \textit{Perspective}.
An important addition to this second study was the inclusion of various flavors of multiconfigurational methods (CASSCF, CASPT2, and NEVPT2) in addition to high-order CC methods including, at least, perturbative triples (see Fig.~\ref{fig:Set2}).
Our results clearly evidence that the error in CC methods is intimately related to the amount of double-excitation character in the vertical transition.
For ``pure'' double excitations (\ie, for transitions which do not mix with single excitations), the error in CC3 and CCSDT can easily reach $1$ and $0.5$ eV, respectively, while it goes down to a few tenths of an electronvolt for more common transitions (such as in \emph{trans}-butadiene and benzene) involving a significant amount of singles.\cite{Shu17,Bar18b,Bar18a}
For ``pure'' double excitations (\ie, for transitions which do not mix with single excitations), the error in CC3 and CCSDT can easily reach $1$ and $0.5$ eV, respectively, while it goes down to a few tenths of an electronvolt for more common transitions (such as in \textit{trans}-butadiene and benzene) involving a significant amount of singles.\cite{Shu17,Bar18b,Bar18a}
The quality of the excitation energies obtained with multiconfigurational methods was harder to predict as the overall accuracy of these methods is highly dependent on both the system and the selected active space.
Nevertheless, CASPT2 and NEVPT2 were found to be more accurate for transition with a small percentage of single excitations (error usually below $0.1$ eV) than for excitations dominated by single excitations where the error is closer from $0.1$--$0.2$ eV (see Fig.~\ref{fig:Set2}).
In our latest study, \cite{Loo20} in order to provide more general conclusions, we generated highly accurate vertical transition energies for larger compounds with a set composed by 27 organic molecules encompassing from four to six non-hydrogen atoms for a total of 223 vertical transition energies of various natures.
This set, labeled as {\SetC} and still based on CC3/\emph{aug}-cc-pVTZ geometries, is constituted by a reasonably good balance of singlet, triplet, valence, and Rydberg states.
This set, labeled as {\SetC} and still based on CC3/\textit{aug}-cc-pVTZ geometries, is constituted by a reasonably good balance of singlet, triplet, valence, and Rydberg states.
To obtain this new, larger set of TBEs, we employed CC methods up to the highest possible order (CC3, CCSDT, and CCSDTQ), very large SCI calculations (with up to hundred million determinants), as well as the most robust multiconfigurational method, NEVPT2.
Each approach was applied in combination with diffuse-containing atomic basis sets.
For all the transitions of the {\SetC} set, we reported at least CCSDT/\emph{aug}-cc-pVTZ (sometimes with basis set extrapolation) and CC3/\emph{aug}-cc-pVQZ transition energies as well as CC3/\emph{aug}-cc-pVTZ oscillator strengths for each dipole-allowed transition.
For all the transitions of the {\SetC} set, we reported at least CCSDT/\textit{aug}-cc-pVTZ (sometimes with basis set extrapolation) and CC3/\textit{aug}-cc-pVQZ transition energies as well as CC3/\textit{aug}-cc-pVTZ oscillator strengths for each dipole-allowed transition.
Pursuing our previous benchmarking efforts, \cite{Loo18a,Loo19c} we confirmed that CC3 almost systematically delivers transition energies in agreement with higher-level theoretical models ($\pm 0.04$ eV) except for transitions presenting a dominant double excitation character (see Fig.~\ref{fig:Set3}).
This settles down, at least for now, the debate by demonstrating the superiority of CC3 (in terms of accuracy) compared to methods like CCSDT-3 or ADC(3), see Fig.~\ref{fig:Set3}.
Moreover, thanks to the exhaustive and detailed comparisons made in Ref.~\onlinecite{Loo20}, we could safely conclude that CC3 also regularly outperforms CASPT2 (which often underestimates excitation energies) and NEVPT2 (which typically overestimates excitation energies) as long as the corresponding transition does not show any strong multiple excitation character.
Moreover, thanks to the exhaustive and detailed comparisons made in Ref.~\citenum{Loo20}, we could safely conclude that CC3 also regularly outperforms CASPT2 (which often underestimates excitation energies) and NEVPT2 (which typically overestimates excitation energies) as long as the corresponding transition does not show any strong multiple excitation character.
Our current efforts are now focussing on expanding and merging these sets to create an complete test set of highly accurate excitations energies.
In particular, we are currently generating reference excitations energies for radicals as well as more ``exotic'' molecules containing heavier atoms (such as \ce{Cl}, \ce{P}, and \ce{Si}). \cite{Loo20b}
In particular, we are currently generating reference excitations energies for radicals as well as more ``exotic'' molecules containing heavier atoms (such as \ce{Cl}, \ce{P}, and \ce{Si}).
The combination of these various sets would potentially create an ensemble of more than 400 vertical transition energies for small- and medium-size molecules based on accurate ground-state geometries.
Such a set would definitely be a valuable asset for the entire electronic structure community.
It would likely stimulate further theoretical developments in excited-state methods and provide a fair ground for the assessments of the currently available and under development excited-state models.
@ -344,7 +446,7 @@ This includes, first, 0-0 energies, \cite{Die04b,Hat05c,Goe10a,Sen11b,Win13,Fan1
However, because 0-0 energies are fairly insensitive to the underlying molecular geometries, \cite{Sen11b,Win13,Loo19a} they are not a good indicator of their overall quality.
Consequently, one can find in the literature several sets of excited-state geometries obtained at various levels of theory, \cite{Pag03,Gua13,Bou13,Tun16,Bud17} some of them being determined using state-of-the-art models. \cite{Gua13,Bud17}
There are also investigations of the accuracy of the nuclear gradients at the Franck-Condon point. \cite{Taj18,Taj19}
The interested researcher may find useful several investigations reporting sets of reference oscillator strengths. \cite{Sil10c,Har14,Kan14,Loo18a,Loo20b}
The interested reader may find useful several investigations reporting sets of reference oscillator strengths. \cite{Sil10c,Har14,Kan14,Loo18a,Loo20a}
More complex properties, such as two-photon cross-sections and vibrations, have been mostly determined at lower levels of theory, hinting at future studies on this particular subject.
%%%%%%%%%%%%%%%%%%
@ -353,18 +455,18 @@ More complex properties, such as two-photon cross-sections and vibrations, have
As concluding remarks, we would like to highlight once again the major contribution brought by Roos' and Thiel's groups in an effort to define benchmark values for excited states.
Following their footsteps, we have recently proposed a larger, even more accurate set of vertical transitions energies for various types of excited states (including double excitations). \cite{Loo18a,Loo19c,Loo20}
This was made possible thanks to a technological renaissance of SCI methods which can now routinely produce near-FCI excitation energies for small- and medium-size organic molecules. \cite{Chi18,Gar18,Gar19}
We hope that new technological advances will enable us to push further in years to come our quest to highly accurate excitation energies, and, importantly, of other excited-state properties.
We hope that new technological advances will enable us to push further, in years to come, our quest to highly accurate excitation energies, and, importantly, of other excited-state properties.
%%%%%%%%%%%%%%%%%%%%%%%%
%%% ACKNOWLEDGEMENTS %%%
%%%%%%%%%%%%%%%%%%%%%%%%
PFL would like to thank Peter Gill for useful discussions.
He also acknowledges funding from the \textit{``Centre National de la Recherche Scientifique''}.
DJ acknowledges the \emph{R\'egion des Pays de la Loire} for financial support.
DJ acknowledges the \textit{R\'egion des Pays de la Loire} for financial support.
%%%%%%%%%%%%%%%%%%%%
%%% BIBLIOGRAPHY %%%
%%%%%%%%%%%%%%%%%%%%
\bibliography{ExPerspective,ExPerspective-control}
\bibliography{ExPerspective}
\end{document}

Binary file not shown.

Binary file not shown.