In [1]:
import pandas as pd

import json

from copy import deepcopy
In [301]:
import warnings
In [214]:
%matplotlib inline

Initial exploration and helper functions

In [4]:
arxiv = pd.read_json('arxiv-metadata-oai-snapshot.json', lines=True, nrows=10)
---------------------------------------------------------------------------
MemoryError                               Traceback (most recent call last)
<ipython-input-4-07635bb615eb> in <module>
----> 1 arxiv = pd.read_json('arxiv-metadata-oai-snapshot.json', lines=True, nrows=10)

~\Anaconda3\lib\site-packages\pandas\util\_decorators.py in wrapper(*args, **kwargs)
    197                 else:
    198                     kwargs[new_arg_name] = new_arg_value
--> 199             return func(*args, **kwargs)
    200 
    201         return cast(F, wrapper)

~\Anaconda3\lib\site-packages\pandas\util\_decorators.py in wrapper(*args, **kwargs)
    294                 )
    295                 warnings.warn(msg, FutureWarning, stacklevel=stacklevel)
--> 296             return func(*args, **kwargs)
    297 
    298         return wrapper

~\Anaconda3\lib\site-packages\pandas\io\json\_json.py in read_json(path_or_buf, orient, typ, dtype, convert_axes, convert_dates, keep_default_dates, numpy, precise_float, date_unit, encoding, lines, chunksize, compression, nrows)
    610         chunksize=chunksize,
    611         compression=compression,
--> 612         nrows=nrows,
    613     )
    614 

~\Anaconda3\lib\site-packages\pandas\io\json\_json.py in __init__(self, filepath_or_buffer, orient, typ, dtype, convert_axes, convert_dates, keep_default_dates, numpy, precise_float, date_unit, encoding, lines, chunksize, compression, nrows)
    678 
    679         data = self._get_data_from_filepath(filepath_or_buffer)
--> 680         self.data = self._preprocess_data(data)
    681 
    682     def _preprocess_data(self, data):

~\Anaconda3\lib\site-packages\pandas\io\json\_json.py in _preprocess_data(self, data)
    691             data = data.read()
    692         if not hasattr(data, "read") and (self.chunksize or self.nrows):
--> 693             data = StringIO(data)
    694 
    695         return data

MemoryError: 
In [8]:
with open('tmp.txt') as f: 
    tmp = json.loads(f.read())
In [10]:
tmp.keys()
Out[10]:
dict_keys(['id', 'submitter', 'authors', 'title', 'comments', 'journal-ref', 'doi', 'report-no', 'categories', 'license', 'abstract', 'versions', 'update_date', 'authors_parsed'])
In [81]:
def get_line_count(filename):
    counter = 0
    with open(filename) as f: 
        for line in f:
            counter +=1
    return counter
In [83]:
get_line_count('arxiv-metadata-oai-snapshot.json')
Out[83]:
1796911
In [86]:
1800000/1000*0.6
Out[86]:
1080.0
In [17]:
def read_n_entries(filename,n):
    with open(filename) as f: 
        head = [json.loads(next(f)) for x in range(n)];
    return head
In [73]:
def parse_json(entry): 
    keys = ['id','authors','title','categories','versions','authors_parsed','doi']
    keys_binary = ['journal-ref','doi','report-no']
    out = {k: deepcopy(entry[k]) for k in keys}
    out['is_published'] = any([(entry[k] != None) for k in keys_binary])
    return out
In [74]:
def read_parse_n_entries(filename,n):
    with open(filename) as f: 
        head = [parse_json(json.loads(next(f))) for x in range(n)];
    return head
In [89]:
def read_parse_all_entries_df(filename):
    out = []
    with open(filename) as f: 
        for line in f:
            out.append(parse_json(json.loads(line)))
    return pd.DataFrame(out)
In [63]:
tmpj = read_n_entries('arxiv-metadata-oai-snapshot.json',10)
In [79]:
pd.DataFrame(read_parse_n_entries('arxiv-metadata-oai-snapshot.json',1000)).info(memory_usage="deep")
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1000 entries, 0 to 999
Data columns (total 8 columns):
 #   Column          Non-Null Count  Dtype 
---  ------          --------------  ----- 
 0   id              1000 non-null   object
 1   authors         1000 non-null   object
 2   title           1000 non-null   object
 3   categories      1000 non-null   object
 4   versions        1000 non-null   object
 5   authors_parsed  1000 non-null   object
 6   doi             659 non-null    object
 7   is_published    1000 non-null   bool  
dtypes: bool(1), object(7)
memory usage: 596.4 KB
In [80]:
pd.DataFrame(read_n_entries('arxiv-metadata-oai-snapshot.json',1000)).info(memory_usage="deep")
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1000 entries, 0 to 999
Data columns (total 14 columns):
 #   Column          Non-Null Count  Dtype 
---  ------          --------------  ----- 
 0   id              1000 non-null   object
 1   submitter       1000 non-null   object
 2   authors         1000 non-null   object
 3   title           1000 non-null   object
 4   comments        901 non-null    object
 5   journal-ref     573 non-null    object
 6   doi             659 non-null    object
 7   report-no       78 non-null     object
 8   categories      1000 non-null   object
 9   license         58 non-null     object
 10  abstract        1000 non-null   object
 11  versions        1000 non-null   object
 12  update_date     1000 non-null   object
 13  authors_parsed  1000 non-null   object
dtypes: object(14)
memory usage: 1.8 MB
In [62]:
df = pd.DataFrame(read_n_entries('arxiv-metadata-oai-snapshot.json',10))

Read the whole parsed json

In [90]:
%%time
arxiv = read_parse_all_entries_df('arxiv-metadata-oai-snapshot.json')
Wall time: 2min 16s
In [91]:
arxiv.info(memory_usage="deep")
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1796911 entries, 0 to 1796910
Data columns (total 8 columns):
 #   Column          Dtype 
---  ------          ----- 
 0   id              object
 1   authors         object
 2   title           object
 3   categories      object
 4   versions        object
 5   authors_parsed  object
 6   doi             object
 7   is_published    bool  
dtypes: bool(1), object(7)
memory usage: 1.1 GB

Categories statistics

In [92]:
arxiv['categories'].value_counts()
Out[92]:
astro-ph                                         86914
hep-ph                                           73550
quant-ph                                         53966
hep-th                                           53287
cond-mat.mtrl-sci                                30107
                                                 ...  
physics.class-ph cond-mat.mtrl-sci gr-qc             1
cs.CG math.GT math.MG                                1
cs.CL cs.SI q-fin.ST                                 1
stat.ML cs.LG math.OC math.ST stat.AP stat.TH        1
math.AG cs.SC math.CV                                1
Name: categories, Length: 62055, dtype: int64
In [94]:
arxiv['categories'].apply(lambda x: len(x.split(' '))).value_counts()
Out[94]:
1     1025259
2      502711
3      187804
4       60999
5       16025
6        3404
7         541
8         121
9          30
10         14
11          2
13          1
Name: categories, dtype: int64

So we have ca. 2/3 entries with a single classification, and rest belongs to more than 1 category

Let's look at the extreme side:

In [95]:
arxiv['categories'].apply(lambda x: len(x.split(' '))).sort_values(ascending=False).head(20)
Out[95]:
77549      13
57365      11
1545826    11
1777614    10
1688950    10
77796      10
1677040    10
1463715    10
1638391    10
1796672    10
1772146    10
19444      10
18505      10
141660     10
1543928    10
1675693    10
1736009    10
1531230     9
1383087     9
158233      9
Name: categories, dtype: int64
In [101]:
arxiv['n_categories'] = arxiv['categories'].apply(lambda x: len(x.split(' ')))
In [97]:
arxiv.iloc[77549]['title']
Out[97]:
'The finite harmonic oscillator and its associated sequences'
In [98]:
arxiv.iloc[57365]['title']
Out[98]:
'Visco-potential free-surface flows and long wave modelling'
In [100]:
arxiv.iloc[1545826]
Out[100]:
id                                                       cs/0410017
authors                    Carl S. McTague and James P. Crutchfield
title             Automated Pattern Detection--An Algorithm for ...
categories        cs.CV cond-mat.stat-mech cs.CL cs.DS cs.IR cs....
versions          [{'version': 'v1', 'created': 'Thu, 7 Oct 2004...
authors_parsed    [[McTague, Carl S., ], [Crutchfield, James P., ]]
doi                                                            None
is_published                                                   True
Name: 1545826, dtype: object

Look at the single categories

In [103]:
arxiv.query('n_categories == 1')['categories'].unique()
Out[103]:
array(['hep-ph', 'physics.gen-ph', 'math.CO', 'cond-mat.mes-hall',
       'gr-qc', 'cond-mat.mtrl-sci', 'astro-ph', 'math.NT', 'hep-th',
       'hep-ex', 'math.NA', 'nlin.PS', 'math.RA', 'cond-mat.str-el',
       'physics.pop-ph', 'nucl-th', 'math.FA', 'cs.DS', 'math.DS',
       'physics.soc-ph', 'math.AG', 'math.OA', 'math.PR', 'math.DG',
       'physics.optics', 'math.GR', 'nlin.SI', 'math.SG',
       'physics.data-an', 'cs.CC', 'math.GT', 'quant-ph',
       'cond-mat.other', 'math.CV', 'math.AP', 'cond-mat.supr-con',
       'math.RT', 'cond-mat.stat-mech', 'q-bio.OT', 'physics.plasm-ph',
       'nlin.CG', 'nucl-ex', 'cond-mat.soft', 'physics.comp-ph',
       'math.MG', 'math.QA', 'physics.bio-ph', 'physics.chem-ph',
       'math.AT', 'physics.geo-ph', 'q-bio.BM', 'math.OC', 'cs.CR',
       'physics.class-ph', 'q-bio.PE', 'q-bio.NC', 'physics.atom-ph',
       'math.GM', 'hep-lat', 'math.CA', 'physics.atm-clus', 'cs.PF',
       'physics.acc-ph', 'math.SP', 'nlin.CD', 'physics.hist-ph',
       'physics.flu-dyn', 'cond-mat.dis-nn', 'cs.CV', 'cs.LG', 'cs.SE',
       'physics.ed-ph', 'physics.ins-det', 'cs.PL', 'q-bio.CB', 'cs.AI',
       'math.LO', 'cs.LO', 'stat.AP', 'nlin.AO', 'cs.DC', 'cs.DM',
       'cs.NI', 'cs.OH', 'q-bio.GN', 'q-bio.MN', 'math.KT', 'math.AC',
       'physics.med-ph', 'cs.HC', 'cs.NE', 'physics.ao-ph', 'math.HO',
       'q-bio.QM', 'cs.MS', 'physics.space-ph', 'cs.DB', 'cs.CL',
       'math.CT', 'cs.CE', 'cs.GT', 'cs.CY', 'cs.CG', 'stat.ME', 'cs.RO',
       'cs.GL', 'cs.MA', 'math.GN', 'cs.IR', 'stat.ML', 'cs.DL', 'cs.SC',
       'q-bio.SC', 'stat.CO', 'cs.NA', 'cs.AR', 'q-bio.TO', 'cs.GR',
       'cs.OS', 'cs.MM', 'cs.SD', 'cond-mat.quant-gas', 'q-fin.GN',
       'q-fin.ST', 'q-fin.PM', 'q-fin.PR', 'q-fin.CP', 'q-fin.RM',
       'astro-ph.HE', 'astro-ph.SR', 'astro-ph.GA', 'astro-ph.CO',
       'astro-ph.IM', 'astro-ph.EP', 'q-fin.TR', 'cs.FL', 'stat.OT',
       'cs.SY', 'cs.SI', 'cs.ET', 'eess.SP', 'q-fin.EC', 'q-fin.MF',
       'physics.app-ph', 'econ.TH', 'eess.IV', 'econ.EM', 'eess.AS',
       'cond-mat'], dtype=object)
In [108]:
versions = arxiv.iloc[0]['versions']
In [109]:
versions
Out[109]:
[{'version': 'v1', 'created': 'Mon, 2 Apr 2007 19:18:42 GMT'},
 {'version': 'v2', 'created': 'Tue, 24 Jul 2007 20:10:27 GMT'}]
In [154]:
def extract_dt_submission(versions_list):
    tmp = pd.to_datetime([item['created'] for item in versions_list if item['version']=='v1'][0])    
    return tmp
In [156]:
arxiv.head(100)['versions'].apply(extract_dt_submission).memory_usage(deep=True)
Out[156]:
928
In [160]:
%%time
arxiv['submitted'] = arxiv['versions'].apply(extract_dt_submission)
Wall time: 11min 25s
In [161]:
arxiv.head()['submitted']
Out[161]:
0   2007-04-02 19:18:42+00:00
1   2007-03-31 02:26:18+00:00
2   2007-04-01 20:46:54+00:00
3   2007-03-31 03:16:14+00:00
4   2007-04-02 18:09:58+00:00
Name: submitted, dtype: datetime64[ns, UTC]
In [162]:
arxiv.info(memory_usage="deep")
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 1796911 entries, 0 to 1796910
Data columns (total 10 columns):
 #   Column          Dtype              
---  ------          -----              
 0   id              object             
 1   authors         object             
 2   title           object             
 3   categories      object             
 4   versions        object             
 5   authors_parsed  object             
 6   doi             object             
 7   is_published    bool               
 8   n_categories    int64              
 9   submitted       datetime64[ns, UTC]
dtypes: bool(1), datetime64[ns, UTC](1), int64(1), object(7)
memory usage: 1.1 GB
In [164]:
%%time
arxiv['n_versions'] = arxiv['versions'].apply(lambda x: len(x))
Wall time: 1.01 s
In [165]:
arxiv.head()
Out[165]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
0 0704.0001 C. Bal\'azs, E. L. Berger, P. M. Nadolsky, C.-... Calculation of prompt diphoton production cros... hep-ph [{'version': 'v1', 'created': 'Mon, 2 Apr 2007... [[Bal√°zs, C., ], [Berger, E. L., ], [Nadolsky,... 10.1103/PhysRevD.76.013009 True 1 2007-04-02 19:18:42+00:00 2
1 0704.0002 Ileana Streinu and Louis Theran Sparsity-certifying Graph Decompositions math.CO cs.CG [{'version': 'v1', 'created': 'Sat, 31 Mar 200... [[Streinu, Ileana, ], [Theran, Louis, ]] None False 2 2007-03-31 02:26:18+00:00 2
2 0704.0003 Hongjun Pan The evolution of the Earth-Moon system based o... physics.gen-ph [{'version': 'v1', 'created': 'Sun, 1 Apr 2007... [[Pan, Hongjun, ]] None False 1 2007-04-01 20:46:54+00:00 3
3 0704.0004 David Callan A determinant of Stirling cycle numbers counts... math.CO [{'version': 'v1', 'created': 'Sat, 31 Mar 200... [[Callan, David, ]] None False 1 2007-03-31 03:16:14+00:00 1
4 0704.0005 Wael Abu-Shammala and Alberto Torchinsky From dyadic $\Lambda_{\alpha}$ to $\Lambda_{\a... math.CA math.FA [{'version': 'v1', 'created': 'Mon, 2 Apr 2007... [[Abu-Shammala, Wael, ], [Torchinsky, Alberto, ]] None True 2 2007-04-02 18:09:58+00:00 1
In [185]:
%%time
arxiv.to_pickle('arxiv.pickle')
Wall time: 29.9 s
In [192]:
arxiv['id'].value_counts()
Out[192]:
math-ph/0409039    2
math-ph/0207039    2
math-ph/0408005    2
math-ph/0212014    2
1508.04881         1
                  ..
1703.06949         1
1806.09726         1
1310.4549          1
1301.1009          1
2001.09869         1
Name: id, Length: 1796907, dtype: int64
In [193]:
arxiv.query('id == "math-ph/0409039"')
Out[193]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1681958 math-ph/0409039 Matthew Cargo, Alfonso Gracia-Saz, R. G. Littl... Moyal star product approach to the Bohr-Sommer... math-ph math.MP [{'version': 'v1', 'created': 'Fri, 17 Sep 200... [[Cargo, Matthew, ], [Gracia-Saz, Alfonso, ], ... 10.1088/0305-4470/38/9/010 True 2 2004-09-17 21:35:01+00:00 1
1733816 math-ph/0409039 Matthew Cargo, Alfonso Gracia-Saz, R. G. Littl... Moyal star product approach to the Bohr-Sommer... math-ph math.MP math.SG [{'version': 'v1', 'created': 'Fri, 17 Sep 200... [[Cargo, Matthew, ], [Gracia-Saz, Alfonso, ], ... 10.1088/0305-4470/38/9/010 True 3 2004-09-17 21:35:01+00:00 1
In [199]:
arxiv.drop(index=[1681958],inplace=True)
In [200]:
arxiv.query('id == "math-ph/0207039"')
Out[200]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1680284 math-ph/0207039 Harald Schmid Bound State Solutions of the Dirac Equation in... math-ph gr-qc math.MP [{'version': 'v1', 'created': 'Fri, 26 Jul 200... [[Schmid, Harald, ]] 10.1002/mana.200410205 True 3 2002-07-26 13:24:04+00:00 2
1725442 math-ph/0207039 Harald Schmid Bound State Solutions of the Dirac Equation in... math-ph gr-qc math.MP [{'version': 'v1', 'created': 'Fri, 26 Jul 200... [[Schmid, Harald, ]] 10.1002/mana.200410205 True 3 2002-07-26 13:24:04+00:00 2
In [197]:
bla.drop(index=[0],inplace=True)
In [198]:
bla
Out[198]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1 0704.0002 Ileana Streinu and Louis Theran Sparsity-certifying Graph Decompositions math.CO cs.CG [{'version': 'v1', 'created': 'Sat, 31 Mar 200... [[Streinu, Ileana, ], [Theran, Louis, ]] None False 2 2007-03-31 02:26:18+00:00 2
2 0704.0003 Hongjun Pan The evolution of the Earth-Moon system based o... physics.gen-ph [{'version': 'v1', 'created': 'Sun, 1 Apr 2007... [[Pan, Hongjun, ]] None False 1 2007-04-01 20:46:54+00:00 3
3 0704.0004 David Callan A determinant of Stirling cycle numbers counts... math.CO [{'version': 'v1', 'created': 'Sat, 31 Mar 200... [[Callan, David, ]] None False 1 2007-03-31 03:16:14+00:00 1
4 0704.0005 Wael Abu-Shammala and Alberto Torchinsky From dyadic $\Lambda_{\alpha}$ to $\Lambda_{\a... math.CA math.FA [{'version': 'v1', 'created': 'Mon, 2 Apr 2007... [[Abu-Shammala, Wael, ], [Torchinsky, Alberto, ]] None True 2 2007-04-02 18:09:58+00:00 1
In [201]:
arxiv.drop(index=[1680284],inplace=True)
In [200]:
arxiv.query('id == "math-ph/0207039"')
Out[200]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1680284 math-ph/0207039 Harald Schmid Bound State Solutions of the Dirac Equation in... math-ph gr-qc math.MP [{'version': 'v1', 'created': 'Fri, 26 Jul 200... [[Schmid, Harald, ]] 10.1002/mana.200410205 True 3 2002-07-26 13:24:04+00:00 2
1725442 math-ph/0207039 Harald Schmid Bound State Solutions of the Dirac Equation in... math-ph gr-qc math.MP [{'version': 'v1', 'created': 'Fri, 26 Jul 200... [[Schmid, Harald, ]] 10.1002/mana.200410205 True 3 2002-07-26 13:24:04+00:00 2
In [202]:
arxiv.query('id == "math-ph/0408005"')
Out[202]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1681863 math-ph/0408005 Kurt Ehlers, Jair Koiller, Richard Montgomery,... Nonholonomic systems via moving frames: Cartan... math-ph math.MP [{'version': 'v1', 'created': 'Mon, 2 Aug 2004... [[Ehlers, Kurt, ], [Koiller, Jair, ], [Montgom... None True 2 2004-08-02 17:43:10+00:00 1
1733815 math-ph/0408005 Kurt Ehlers, Jair Koiller, Richard Montgomery,... Nonholonomic systems via moving frames: Cartan... math-ph math.MP math.SG [{'version': 'v1', 'created': 'Mon, 2 Aug 2004... [[Ehlers, Kurt, ], [Koiller, Jair, ], [Montgom... None True 3 2004-08-02 17:43:10+00:00 1
In [203]:
arxiv.drop(index=[1681863],inplace=True)
In [204]:
arxiv.query('id == "math-ph/0212014"')
Out[204]:
id authors title categories versions authors_parsed doi is_published n_categories submitted n_versions
1680561 math-ph/0212014 Pedro de M. Rios A semiclassically entangled puzzle math-ph math.MP quant-ph [{'version': 'v1', 'created': 'Wed, 4 Dec 2002... [[Rios, Pedro de M., ]] None True 3 2002-12-04 01:34:01+00:00 1
1733814 math-ph/0212014 Pedro de M. Rios A semiclassically entangled puzzle math-ph math.MP math.SG quant-ph [{'version': 'v1', 'created': 'Wed, 4 Dec 2002... [[Rios, Pedro de M., ]] 10.1088/1751-8113/40/49/F02 True 4 2002-12-04 01:34:01+00:00 1
In [205]:
arxiv.drop(index=[1680561],inplace=True)
In [207]:
%%time
arxiv.to_pickle('arxiv.pickle')
Wall time: 25.2 s

let's look for some patterns

In [254]:
def groupby_2d(array_to_gb, df):
    return df.groupby(array_to_gb)['id'].count().unstack().fillna(0)
In [230]:
def normalize_by_rowsum(df):
    df2 = df.divide(df.sum(axis=1), axis=0)
    return df2

year vs. # cross-disciplinary papers

In [255]:
year_vs_ncat = groupby_2d([arxiv['submitted'].dt.year, arxiv['n_categories']],arxiv)

year_vs_ncat2 = normalize_by_rowsum(year_vs_ncat)
In [256]:
year_vs_ncat.sum(axis=1).plot.bar()
Out[256]:
<AxesSubplot:xlabel='submitted'>
In [425]:
year_vs_ncat2.plot.area(stacked=True)
Out[425]:
<AxesSubplot:xlabel='submitted'>

# papers that are cross-disciplinary increases steadily

In [248]:
plt.scatter(y=year_vs_ncat[1], x=year_vs_ncat.sum(axis=1))
plt.xlabel('# of all papers');
plt.ylabel('# papers of single category');
In [249]:
plt.scatter(y=year_vs_ncat[1]/year_vs_ncat.sum(axis=1), x=year_vs_ncat.sum(axis=1))
plt.xlabel('# of all papers');
plt.ylabel('% papers of single category');

year vs # of papers in a discipline, only for single discipline papers

In [264]:
arxiv_tmp = arxiv.query('n_categories == 1')
year_vs_cat = groupby_2d([arxiv_tmp['submitted'].dt.year, arxiv_tmp['categories']], arxiv_tmp)
In [260]:
pd.options.display.max_rows = 150
pd.options.display.max_columns = 35
In [266]:
year_vs_cat.T
Out[266]:
submitted 1988 1989 1990 1991 1992 1993 1994 1995 1996 1997 1998 1999 2000 2001 2002 2003 2004 2005 2006 2007 2008 2009 2010 2011 2012 2013 2014 2015 2016 2017 2018 2019 2020
categories
astro-ph 0.0 0.0 0.0 0.0 36.0 403.0 901.0 1508.0 2201.0 3357.0 4394.0 5274.0 5913.0 6315.0 6494.0 7280.0 7565.0 8082.0 8485.0 9398.0 9308.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
astro-ph.CO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2478.0 2738.0 2656.0 2477.0 2499.0 1008.0 907.0 804.0 825.0 816.0 778.0 760.0
astro-ph.EP 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 519.0 616.0 655.0 638.0 815.0 939.0 969.0 1061.0 1191.0 1318.0 1210.0 767.0
astro-ph.GA 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 993.0 1014.0 941.0 889.0 921.0 1880.0 2244.0 2453.0 2510.0 2751.0 2555.0 2296.0
astro-ph.HE 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 6.0 1109.0 1108.0 1315.0 1156.0 1454.0 1282.0 1576.0 1481.0 1853.0 1682.0 1768.0 1477.0
astro-ph.IM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 370.0 398.0 438.0 432.0 377.0 550.0 514.0 579.0 620.0 824.0 640.0 435.0
astro-ph.SR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 5.0 1875.0 2159.0 2206.0 1954.0 2134.0 2359.0 2207.0 1907.0 1700.0 1908.0 1381.0 1199.0
cond-mat 0.0 0.0 0.0 0.0 187.0 592.0 1104.0 1482.0 1571.0 617.0 646.0 645.0 604.0 583.0 668.0 739.0 24.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
cond-mat.dis-nn 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 39.0 118.0 166.0 190.0 184.0 186.0 239.0 209.0 274.0 251.0 229.0 144.0 143.0 123.0 135.0 109.0 109.0 104.0 103.0 105.0 129.0 143.0 115.0 92.0 89.0
cond-mat.mes-hall 0.0 0.0 0.0 0.0 0.0 0.0 1.0 1.0 110.0 333.0 350.0 462.0 450.0 514.0 575.0 704.0 835.0 823.0 908.0 952.0 991.0 1049.0 1471.0 1602.0 1447.0 1855.0 1862.0 2182.0 2346.0 2239.0 2270.0 1911.0 1508.0
cond-mat.mtrl-sci 0.0 0.0 0.0 0.0 0.0 2.0 2.0 0.0 46.0 155.0 217.0 249.0 355.0 419.0 632.0 722.0 894.0 988.0 1081.0 1189.0 1230.0 969.0 1139.0 1319.0 1255.0 1675.0 1733.0 2105.0 2429.0 2562.0 2444.0 2123.0 2173.0
cond-mat.other 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 1.0 25.0 497.0 621.0 547.0 616.0 557.0 303.0 142.0 105.0 60.0 42.0 59.0 63.0 82.0 85.0 61.0 38.0 25.0
cond-mat.quant-gas 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 0.0 0.0 1.0 1.0 0.0 1.0 300.0 429.0 464.0 420.0 452.0 488.0 546.0 450.0 432.0 415.0 323.0 315.0
cond-mat.soft 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 25.0 80.0 105.0 131.0 200.0 266.0 357.0 403.0 421.0 433.0 396.0 423.0 371.0 366.0 431.0 402.0 403.0 600.0 654.0 702.0 803.0 808.0 783.0 702.0 673.0
cond-mat.stat-mech 0.0 0.0 0.0 0.0 0.0 1.0 3.0 4.0 129.0 448.0 605.0 636.0 746.0 769.0 796.0 894.0 918.0 897.0 808.0 767.0 734.0 671.0 669.0 650.0 586.0 712.0 754.0 718.0 727.0 752.0 713.0 682.0 570.0
cond-mat.str-el 0.0 0.0 0.0 0.0 0.0 1.0 1.0 1.0 84.0 395.0 528.0 597.0 648.0 642.0 683.0 757.0 757.0 915.0 851.0 797.0 915.0 824.0 990.0 1094.0 965.0 1117.0 1209.0 1203.0 1339.0 1322.0 1409.0 1296.0 1035.0
cond-mat.supr-con 0.0 0.0 0.0 0.0 0.0 0.0 2.0 0.0 81.0 311.0 334.0 487.0 478.0 725.0 627.0 590.0 556.0 494.0 539.0 410.0 703.0 643.0 776.0 776.0 711.0 771.0 754.0 695.0 728.0 742.0 737.0 603.0 424.0
cs.AI 0.0 0.0 0.0 0.0 0.0 6.0 14.0 26.0 28.0 18.0 13.0 5.0 37.0 8.0 43.0 39.0 58.0 35.0 57.0 52.0 74.0 107.0 169.0 403.0 438.0 1107.0 411.0 331.0 381.0 598.0 714.0 491.0 607.0
cs.AR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 3.0 2.0 0.0 5.0 3.0 17.0 114.0 6.0 7.0 24.0 32.0 31.0 45.0 68.0 47.0 72.0 101.0 102.0 94.0 148.0
cs.CC 0.0 0.0 1.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 7.0 21.0 4.0 14.0 20.0 18.0 17.0 19.0 31.0 45.0 55.0 81.0 105.0 91.0 113.0 141.0 128.0 153.0 136.0 152.0 128.0 113.0 122.0
cs.CE 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 5.0 7.0 9.0 6.0 11.0 11.0 17.0 3.0 8.0 16.0 16.0 45.0 59.0 74.0 53.0 67.0 87.0 95.0 115.0 159.0
cs.CG 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 5.0 16.0 3.0 3.0 12.0 7.0 4.0 12.0 20.0 26.0 41.0 47.0 62.0 62.0 88.0 122.0 121.0 140.0 153.0 186.0 214.0 161.0 142.0
cs.CL 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 22.0 40.0 85.0 52.0 39.0 29.0 24.0 6.0 14.0 29.0 25.0 42.0 46.0 57.0 83.0 119.0 209.0 289.0 780.0 1295.0 1940.0 2172.0 2510.0
cs.CR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 5.0 3.0 9.0 6.0 11.0 33.0 44.0 68.0 55.0 68.0 136.0 256.0 228.0 320.0 270.0 356.0 399.0 449.0 704.0 1000.0 1039.0 993.0
cs.CV 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 8.0 0.0 1.0 10.0 6.0 9.0 17.0 23.0 31.0 57.0 175.0 174.0 255.0 453.0 776.0 1406.0 2358.0 3825.0 5480.0 5322.0 5197.0
cs.CY 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 2.0 2.0 84.0 1.0 7.0 4.0 3.0 1.0 18.0 23.0 35.0 50.0 36.0 80.0 164.0 194.0 256.0 324.0 364.0 429.0 337.0 505.0
cs.DB 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 3.0 5.0 8.0 11.0 25.0 21.0 13.0 21.0 42.0 37.0 47.0 108.0 145.0 233.0 153.0 169.0 163.0 211.0 232.0 244.0 259.0 268.0
cs.DC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 2.0 8.0 19.0 13.0 71.0 26.0 18.0 36.0 55.0 51.0 49.0 151.0 144.0 174.0 211.0 267.0 400.0 400.0 544.0 671.0 672.0 625.0
cs.DL 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 12.0 1.0 3.0 5.0 2.0 7.0 16.0 15.0 8.0 13.0 15.0 37.0 49.0 61.0 113.0 86.0 113.0 106.0 140.0 244.0 110.0 126.0
cs.DM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 4.0 3.0 1.0 5.0 7.0 17.0 28.0 55.0 72.0 87.0 93.0 102.0 63.0 43.0 75.0 132.0 120.0 139.0 97.0 52.0 47.0
cs.DS 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 1.0 0.0 4.0 5.0 8.0 2.0 18.0 15.0 24.0 35.0 35.0 56.0 102.0 147.0 232.0 284.0 285.0 403.0 476.0 531.0 604.0 628.0 734.0 653.0 645.0
cs.ET 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 7.0 15.0 15.0 52.0 78.0 81.0 100.0 100.0 81.0 64.0
cs.FL 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 42.0 60.0 70.0 57.0 79.0 117.0 114.0 86.0 119.0 101.0 132.0 98.0
cs.GL 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 1.0 1.0 2.0 1.0 1.0 4.0 0.0 3.0 4.0 5.0 1.0 2.0 0.0 6.0 3.0 1.0 1.0 4.0 3.0 3.0 6.0 4.0
cs.GR 0.0 0.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 7.0 2.0 3.0 4.0 3.0 5.0 4.0 12.0 10.0 12.0 42.0 30.0 53.0 51.0 86.0 141.0 111.0 119.0
cs.GT 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 7.0 3.0 3.0 7.0 12.0 29.0 41.0 54.0 99.0 120.0 146.0 166.0 220.0 213.0 242.0 261.0 258.0 238.0 211.0
cs.HC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 0.0 5.0 4.0 5.0 5.0 4.0 26.0 51.0 41.0 31.0 40.0 29.0 38.0 57.0 95.0 94.0 184.0 215.0 315.0 412.0 518.0
cs.IR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 1.0 1.0 4.0 3.0 15.0 9.0 18.0 12.0 36.0 67.0 62.0 89.0 98.0 102.0 121.0 109.0 239.0 300.0 220.0 295.0
cs.LG 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 6.0 2.0 2.0 3.0 2.0 15.0 19.0 18.0 32.0 49.0 94.0 88.0 110.0 200.0 233.0 400.0 461.0 628.0 195.0 114.0 479.0
cs.LO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 3.0 24.0 22.0 17.0 25.0 29.0 51.0 66.0 82.0 102.0 110.0 193.0 197.0 201.0 245.0 330.0 352.0 372.0 420.0 460.0 357.0 333.0
cs.MA 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 3.0 4.0 5.0 5.0 4.0 14.0 19.0 22.0 19.0 25.0 32.0 27.0 32.0 35.0 74.0 77.0 70.0
cs.MM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 1.0 3.0 3.0 8.0 15.0 41.0 30.0 24.0 24.0 46.0 45.0 72.0 89.0 110.0 65.0 55.0
cs.MS 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 0.0 1.0 5.0 0.0 3.0 3.0 1.0 9.0 5.0 4.0 9.0 7.0 9.0 9.0 7.0 15.0 29.0 32.0 24.0 28.0 35.0 22.0
cs.NA 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 1.0 3.0 1.0 4.0 4.0 2.0 6.0 13.0 19.0 21.0 18.0 15.0 29.0 25.0 26.0 44.0 55.0 49.0 26.0 1.0
cs.NE 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 0.0 1.0 3.0 7.0 8.0 16.0 12.0 22.0 28.0 21.0 50.0 57.0 67.0 89.0 113.0 119.0 110.0 182.0 262.0 211.0 228.0
cs.NI 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 60.0 8.0 6.0 4.0 13.0 16.0 41.0 32.0 62.0 82.0 113.0 191.0 475.0 338.0 507.0 563.0 584.0 537.0 708.0 756.0 937.0 792.0 600.0
cs.OH 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 4.0 9.0 5.0 6.0 11.0 8.0 17.0 102.0 187.0 68.0 163.0 75.0 181.0 139.0 153.0 117.0 93.0 78.0 77.0 64.0 49.0
cs.OS 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 1.0 2.0 2.0 3.0 9.0 4.0 16.0 17.0 13.0 22.0 14.0 19.0 16.0 17.0 22.0 30.0 30.0
cs.PF 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 4.0 1.0 0.0 6.0 8.0 8.0 9.0 21.0 14.0 14.0 19.0 22.0 20.0 23.0 44.0 53.0 43.0 37.0
cs.PL 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 3.0 2.0 15.0 13.0 12.0 9.0 32.0 14.0 13.0 38.0 16.0 29.0 66.0 99.0 84.0 129.0 119.0 143.0 172.0 196.0 255.0 242.0 211.0
cs.RO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 12.0 6.0 21.0 84.0 44.0 31.0 30.0 46.0 56.0 74.0 121.0 137.0 314.0 564.0 800.0 960.0 1026.0
cs.SC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 4.0 6.0 6.0 13.0 5.0 12.0 20.0 19.0 22.0 16.0 44.0 37.0 29.0 44.0 52.0 45.0 36.0 25.0
cs.SD 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 2.0 0.0 0.0 0.0 0.0 0.0 1.0 2.0 9.0 8.0 14.0 8.0 17.0 19.0 53.0 104.0 90.0 7.0 2.0 2.0
cs.SE 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 8.0 7.0 3.0 10.0 17.0 30.0 6.0 13.0 28.0 28.0 41.0 67.0 151.0 144.0 242.0 247.0 470.0 267.0 308.0 459.0 637.0 643.0 671.0
cs.SI 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 6.0 20.0 18.0 18.0 62.0 171.0 157.0 239.0 271.0 200.0 269.0
cs.SY 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 9.0 27.0 95.0 182.0 245.0 376.0 435.0 625.0 658.0 337.0 0.0
econ.EM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 31.0 158.0 141.0 153.0
econ.TH 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 45.0 83.0 111.0
eess.AS 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 13.0 45.0 129.0
eess.IV 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 20.0 152.0 214.0 223.0
eess.SP 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 1.0 0.0 0.0 216.0 1051.0 1141.0 1255.0
gr-qc 0.0 0.0 0.0 0.0 54.0 268.0 456.0 515.0 567.0 682.0 740.0 813.0 853.0 824.0 831.0 856.0 964.0 1048.0 1075.0 1170.0 1117.0 1167.0 887.0 766.0 810.0 984.0 1045.0 1174.0 1116.0 1157.0 1226.0 1245.0 1145.0
hep-ex 0.0 0.0 0.0 0.0 0.0 0.0 53.0 139.0 142.0 283.0 376.0 620.0 655.0 761.0 738.0 715.0 846.0 812.0 805.0 810.0 867.0 782.0 562.0 922.0 854.0 592.0 600.0 544.0 490.0 568.0 510.0 435.0 303.0
hep-lat 0.0 0.0 0.0 0.0 241.0 267.0 316.0 311.0 415.0 395.0 435.0 416.0 339.0 418.0 405.0 385.0 405.0 476.0 351.0 408.0 340.0 352.0 289.0 258.0 241.0 333.0 263.0 306.0 239.0 285.0 226.0 167.0 93.0
hep-ph 0.0 0.0 0.0 0.0 646.0 1507.0 2062.0 2436.0 2698.0 2893.0 2920.0 3160.0 3075.0 3103.0 3155.0 2926.0 3122.0 2911.0 2970.0 3027.0 3042.0 2979.0 2325.0 2335.0 2208.0 2408.0 2311.0 2513.0 2450.0 2338.0 2295.0 2117.0 1618.0
hep-th 1.0 0.0 0.0 286.0 1172.0 1517.0 1626.0 1753.0 1948.0 2026.0 2015.0 2035.0 2267.0 2186.0 2241.0 2234.0 2220.0 2096.0 2095.0 2151.0 2127.0 2063.0 1567.0 1429.0 1423.0 1557.0 1642.0 1677.0 1640.0 1621.0 1676.0 1657.0 1339.0
math.AC 0.0 0.0 0.0 0.0 0.0 1.0 5.0 1.0 0.0 0.0 2.0 3.0 9.0 9.0 87.0 59.0 84.0 77.0 113.0 123.0 113.0 123.0 181.0 172.0 197.0 270.0 245.0 253.0 293.0 315.0 307.0 269.0 239.0
math.AG 0.0 0.0 0.0 0.0 2.0 1.0 2.0 0.0 9.0 6.0 261.0 311.0 362.0 325.0 352.0 390.0 378.0 462.0 514.0 554.0 592.0 617.0 767.0 819.0 856.0 975.0 1018.0 1034.0 1140.0 1202.0 1145.0 1173.0 961.0
math.AP 0.0 0.0 0.0 0.0 6.0 1.0 0.0 4.0 0.0 5.0 21.0 21.0 41.0 52.0 58.0 130.0 137.0 215.0 384.0 384.0 530.0 685.0 853.0 1029.0 1325.0 1660.0 1930.0 2165.0 2165.0 2476.0 2725.0 2724.0 2473.0
math.AT 0.0 0.0 0.0 0.0 0.0 0.0 0.0 6.0 0.0 2.0 25.0 14.0 31.0 49.0 55.0 69.0 71.0 63.0 86.0 109.0 96.0 162.0 133.0 178.0 171.0 197.0 218.0 224.0 248.0 311.0 305.0 272.0 238.0
math.CA 0.0 0.0 0.0 0.0 3.0 22.0 34.0 19.0 10.0 7.0 20.0 34.0 23.0 40.0 79.0 93.0 99.0 108.0 142.0 234.0 181.0 218.0 334.0 392.0 487.0 544.0 572.0 734.0 762.0 812.0 694.0 598.0 512.0
math.CO 0.0 0.0 0.0 1.0 1.0 6.0 22.0 36.0 9.0 44.0 91.0 75.0 88.0 96.0 136.0 196.0 273.0 329.0 422.0 487.0 567.0 680.0 830.0 1050.0 1114.0 1402.0 1602.0 1663.0 1836.0 2091.0 2176.0 2122.0 1982.0
math.CT 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 4.0 6.0 8.0 10.0 20.0 20.0 18.0 26.0 45.0 25.0 44.0 49.0 69.0 61.0 80.0 94.0 79.0 103.0 85.0 110.0 116.0 113.0
math.CV 0.0 0.0 0.0 0.0 10.0 5.0 10.0 22.0 32.0 22.0 23.0 30.0 51.0 37.0 45.0 57.0 74.0 108.0 100.0 146.0 158.0 163.0 246.0 259.0 253.0 332.0 396.0 376.0 423.0 456.0 413.0 408.0 362.0
math.DG 0.0 0.0 0.0 0.0 9.0 2.0 3.0 10.0 8.0 11.0 118.0 104.0 133.0 144.0 150.0 228.0 258.0 299.0 393.0 462.0 527.0 550.0 683.0 746.0 768.0 914.0 929.0 960.0 905.0 954.0 1018.0 945.0 813.0
math.DS 0.0 0.0 3.0 21.0 17.0 9.0 20.0 21.0 30.0 19.0 16.0 46.0 36.0 50.0 63.0 141.0 140.0 156.0 218.0 226.0 273.0 317.0 371.0 557.0 576.0 679.0 774.0 892.0 882.0 956.0 903.0 948.0 753.0
math.FA 0.0 1.0 10.0 15.0 50.0 45.0 61.0 33.0 46.0 55.0 32.0 58.0 66.0 62.0 75.0 76.0 101.0 127.0 111.0 163.0 248.0 278.0 411.0 502.0 549.0 669.0 762.0 758.0 811.0 872.0 994.0 1017.0 900.0
math.GM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 7.0 42.0 34.0 41.0 69.0 52.0 109.0 97.0 114.0 142.0 106.0 125.0 99.0 101.0 80.0 122.0 153.0 168.0 160.0 154.0 285.0 241.0
math.GN 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 21.0 15.0 12.0 9.0 41.0 17.0 20.0 18.0 16.0 22.0 31.0 31.0 59.0 70.0 99.0 88.0 91.0 114.0 130.0 130.0 166.0 175.0 119.0
math.GR 0.0 0.0 0.0 1.0 2.0 15.0 13.0 14.0 18.0 19.0 24.0 16.0 32.0 38.0 59.0 86.0 155.0 150.0 165.0 186.0 186.0 246.0 315.0 333.0 317.0 442.0 458.0 514.0 468.0 493.0 526.0 508.0 489.0
math.GT 0.0 0.0 0.0 0.0 0.0 4.0 6.0 3.0 11.0 40.0 112.0 105.0 108.0 107.0 130.0 156.0 196.0 190.0 241.0 233.0 262.0 288.0 299.0 344.0 351.0 416.0 441.0 482.0 461.0 491.0 489.0 505.0 467.0
math.HO 0.0 0.0 0.0 0.0 2.0 1.0 4.0 0.0 0.0 1.0 1.0 7.0 2.0 6.0 10.0 24.0 14.0 13.0 24.0 33.0 32.0 51.0 46.0 52.0 73.0 87.0 107.0 109.0 136.0 92.0 122.0 107.0 89.0
math.KT 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 4.0 11.0 9.0 10.0 10.0 16.0 13.0 23.0 32.0 23.0 18.0 35.0 40.0 42.0 52.0 59.0 48.0 36.0 26.0 49.0 28.0 23.0
math.LO 0.0 1.0 3.0 6.0 43.0 52.0 59.0 63.0 59.0 62.0 47.0 57.0 43.0 53.0 46.0 44.0 66.0 58.0 78.0 90.0 109.0 157.0 152.0 203.0 241.0 285.0 360.0 407.0 432.0 454.0 526.0 459.0 421.0
math.MG 0.0 0.0 0.0 0.0 2.0 0.0 2.0 4.0 1.0 1.0 14.0 15.0 10.0 14.0 13.0 26.0 41.0 26.0 35.0 65.0 44.0 65.0 120.0 108.0 128.0 138.0 193.0 205.0 225.0 164.0 182.0 173.0 149.0
math.NA 0.0 0.0 0.0 0.0 2.0 0.0 0.0 0.0 1.0 0.0 3.0 32.0 24.0 29.0 23.0 31.0 30.0 45.0 72.0 98.0 140.0 148.0 280.0 352.0 483.0 741.0 972.0 1087.0 1296.0 1472.0 1500.0 495.0 0.0
math.NT 0.0 0.0 0.0 0.0 3.0 0.0 8.0 13.0 9.0 20.0 60.0 82.0 72.0 84.0 130.0 166.0 260.0 279.0 346.0 424.0 451.0 513.0 688.0 849.0 970.0 1167.0 1214.0 1315.0 1485.0 1464.0 1532.0 1425.0 1427.0
math.OA 0.0 0.0 0.0 0.0 2.0 0.0 0.0 5.0 4.0 1.0 27.0 49.0 70.0 68.0 71.0 91.0 76.0 95.0 138.0 120.0 94.0 98.0 145.0 157.0 190.0 183.0 227.0 205.0 211.0 186.0 174.0 155.0 139.0
math.OC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 0.0 0.0 0.0 14.0 15.0 12.0 20.0 25.0 33.0 52.0 80.0 91.0 118.0 139.0 209.0 171.0 378.0 549.0 840.0 963.0 1161.0 1422.0 1647.0 1607.0 1361.0
math.PR 0.0 0.0 0.0 0.0 0.0 1.0 1.0 1.0 0.0 9.0 35.0 25.0 27.0 46.0 78.0 124.0 326.0 517.0 599.0 640.0 595.0 776.0 885.0 1094.0 1145.0 1407.0 1491.0 1539.0 1544.0 1581.0 1671.0 1521.0 1330.0
math.QA 0.0 0.0 0.0 0.0 3.0 0.0 0.0 0.0 1.0 0.0 186.0 127.0 146.0 117.0 137.0 129.0 103.0 117.0 96.0 79.0 93.0 96.0 117.0 109.0 98.0 124.0 128.0 114.0 128.0 116.0 130.0 128.0 74.0
math.RA 0.0 0.0 0.0 0.0 0.0 1.0 0.0 1.0 9.0 8.0 14.0 12.0 27.0 29.0 42.0 35.0 63.0 100.0 96.0 144.0 169.0 190.0 226.0 250.0 289.0 389.0 386.0 422.0 386.0 443.0 434.0 431.0 424.0
math.RT 0.0 0.0 0.0 0.0 3.0 2.0 2.0 10.0 9.0 6.0 18.0 16.0 27.0 31.0 68.0 96.0 91.0 112.0 138.0 185.0 197.0 219.0 280.0 324.0 321.0 392.0 437.0 417.0 451.0 525.0 470.0 423.0 387.0
math.SG 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 6.0 11.0 19.0 24.0 22.0 40.0 43.0 31.0 32.0 55.0 48.0 59.0 66.0 77.0 85.0 94.0 118.0 119.0 86.0 90.0 124.0 99.0 83.0
math.SP 0.0 0.0 0.0 0.0 0.0 1.0 1.0 0.0 1.0 0.0 9.0 16.0 8.0 12.0 12.0 13.0 29.0 28.0 21.0 37.0 30.0 45.0 67.0 78.0 88.0 101.0 108.0 141.0 108.0 139.0 131.0 95.0 63.0
nlin.AO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 21.0 15.0 13.0 14.0 29.0 27.0 42.0 36.0 29.0 42.0 28.0 31.0 28.0 23.0 32.0 58.0 52.0 72.0 55.0 61.0 56.0
nlin.CD 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 216.0 200.0 205.0 195.0 195.0 185.0 218.0 170.0 198.0 158.0 112.0 136.0 112.0 141.0 146.0 130.0 120.0 131.0 126.0 93.0 59.0
nlin.CG 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 11.0 11.0 8.0 7.0 11.0 14.0 11.0 4.0 9.0 12.0 11.0 13.0 8.0 19.0 9.0 8.0 12.0 12.0 15.0
nlin.PS 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 73.0 64.0 73.0 86.0 90.0 93.0 93.0 103.0 80.0 83.0 44.0 66.0 56.0 74.0 85.0 77.0 99.0 109.0 106.0 84.0 79.0
nlin.SI 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 2.0 89.0 119.0 115.0 101.0 101.0 123.0 147.0 101.0 122.0 128.0 97.0 77.0 95.0 90.0 105.0 82.0 92.0 124.0 84.0 96.0 57.0
nucl-ex 0.0 0.0 0.0 0.0 0.0 0.0 3.0 16.0 39.0 50.0 87.0 150.0 153.0 210.0 260.0 271.0 428.0 397.0 387.0 506.0 485.0 470.0 310.0 351.0 335.0 310.0 271.0 242.0 219.0 244.0 264.0 198.0 194.0
nucl-th 0.0 0.0 0.0 0.0 37.0 251.0 304.0 367.0 473.0 596.0 713.0 736.0 665.0 683.0 775.0 855.0 855.0 793.0 749.0 843.0 756.0 797.0 705.0 614.0 538.0 612.0 584.0 601.0 607.0 625.0 595.0 553.0 459.0
physics.acc-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 14.0 18.0 25.0 236.0 135.0 44.0 46.0 80.0 37.0 61.0 37.0 46.0 59.0 86.0 172.0 267.0 304.0 278.0 285.0 287.0 288.0 306.0 171.0 195.0
physics.ao-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 2.0 2.0 3.0 10.0 3.0 4.0 23.0 17.0 24.0 35.0 31.0 36.0 35.0 38.0 42.0 42.0 58.0 73.0 75.0 81.0 99.0 113.0 128.0 145.0
physics.app-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 300.0 600.0 658.0 570.0
physics.atm-clus 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 2.0 8.0 8.0 11.0 12.0 20.0 12.0 27.0 14.0 21.0 22.0 22.0 17.0 22.0 18.0 13.0 28.0 23.0 37.0 29.0 52.0 25.0 27.0
physics.atom-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 12.0 44.0 43.0 69.0 75.0 95.0 114.0 117.0 173.0 170.0 209.0 209.0 239.0 235.0 222.0 214.0 233.0 356.0 343.0 365.0 392.0 392.0 463.0 377.0 279.0
physics.bio-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 6.0 0.0 5.0 3.0 6.0 7.0 25.0 43.0 42.0 54.0 49.0 60.0 44.0 34.0 52.0 33.0 47.0 65.0 61.0 148.0 104.0 67.0 74.0
physics.chem-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 7.0 21.0 17.0 20.0 25.0 21.0 31.0 28.0 57.0 68.0 45.0 80.0 71.0 89.0 92.0 77.0 87.0 132.0 172.0 217.0 322.0 389.0 438.0 361.0 432.0
physics.class-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 9.0 15.0 18.0 20.0 17.0 8.0 33.0 18.0 80.0 58.0 119.0 116.0 141.0 89.0 73.0 112.0 120.0 132.0 119.0 165.0 137.0 144.0 185.0 98.0
physics.comp-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 7.0 12.0 11.0 9.0 8.0 20.0 45.0 24.0 23.0 23.0 34.0 33.0 47.0 41.0 31.0 32.0 61.0 77.0 67.0 114.0 151.0 269.0 251.0 222.0
physics.data-an 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 8.0 7.0 10.0 13.0 24.0 19.0 45.0 26.0 32.0 49.0 58.0 39.0 38.0 34.0 34.0 33.0 38.0 48.0 56.0 48.0 33.0 43.0 33.0 32.0
physics.ed-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 7.0 16.0 12.0 12.0 25.0 19.0 27.0 49.0 43.0 39.0 28.0 20.0 38.0 45.0 45.0 86.0 99.0 112.0 196.0 112.0 155.0 130.0 173.0
physics.flu-dyn 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 8.0 7.0 15.0 20.0 32.0 29.0 50.0 51.0 66.0 108.0 146.0 181.0 223.0 311.0 231.0 314.0 395.0 508.0 501.0 638.0 805.0 878.0 681.0 833.0
physics.gen-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 44.0 52.0 111.0 178.0 206.0 131.0 134.0 162.0 275.0 313.0 378.0 387.0 357.0 423.0 466.0 372.0 324.0 211.0 222.0 365.0 361.0 302.0 323.0 224.0
physics.geo-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 3.0 13.0 9.0 12.0 17.0 23.0 34.0 21.0 37.0 79.0 45.0 59.0 72.0 71.0 73.0 70.0 60.0 94.0 153.0 154.0 175.0 143.0
physics.hist-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 7.0 7.0 4.0 5.0 8.0 10.0 15.0 23.0 28.0 22.0 19.0 23.0 21.0 38.0 93.0 86.0 81.0 98.0 85.0 65.0 76.0 73.0 78.0
physics.ins-det 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 11.0 18.0 18.0 18.0 49.0 44.0 80.0 102.0 130.0 128.0 167.0 124.0 150.0 115.0 128.0 110.0 191.0 225.0 294.0 346.0 380.0 409.0 360.0 318.0
physics.med-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 1.0 2.0 2.0 10.0 13.0 14.0 50.0 44.0 25.0 33.0 36.0 40.0 39.0 62.0 82.0 111.0 105.0 130.0 199.0 174.0 179.0
physics.optics 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 7.0 20.0 16.0 42.0 38.0 51.0 129.0 150.0 193.0 304.0 299.0 380.0 459.0 554.0 565.0 632.0 863.0 1090.0 1225.0 1190.0 1138.0 1104.0 1045.0 874.0
physics.plasm-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 15.0 26.0 26.0 14.0 27.0 38.0 27.0 213.0 49.0 73.0 92.0 127.0 142.0 177.0 237.0 230.0 361.0 396.0 408.0 487.0 583.0 515.0 440.0 437.0
physics.pop-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 11.0 2.0 4.0 1.0 2.0 6.0 1.0 2.0 8.0 12.0 8.0 10.0 12.0 10.0 23.0 25.0 24.0 27.0 43.0 36.0 29.0 50.0 37.0 39.0
physics.soc-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 0.0 3.0 7.0 3.0 156.0 151.0 170.0 153.0 191.0 111.0 44.0 47.0 62.0 90.0 171.0 182.0 220.0 239.0 211.0 282.0
physics.space-ph 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 1.0 3.0 7.0 5.0 1.0 5.0 12.0 7.0 12.0 7.0 9.0 11.0 22.0 20.0 15.0 33.0 27.0 38.0 87.0 80.0 88.0 78.0 55.0
q-bio.BM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 20.0 54.0 57.0 51.0 43.0 48.0 42.0 27.0 25.0 28.0 53.0 65.0 78.0 62.0 59.0 50.0 62.0 82.0
q-bio.CB 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 5.0 11.0 13.0 8.0 9.0 7.0 9.0 7.0 11.0 14.0 9.0 28.0 20.0 36.0 30.0 26.0 23.0
q-bio.GN 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 10.0 12.0 25.0 33.0 25.0 20.0 19.0 18.0 16.0 39.0 104.0 65.0 64.0 51.0 38.0 45.0 39.0 40.0
q-bio.MN 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 5.0 21.0 26.0 23.0 41.0 26.0 28.0 35.0 37.0 42.0 66.0 64.0 76.0 53.0 51.0 51.0 42.0 44.0
q-bio.NC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 5.0 1.0 1.0 0.0 0.0 9.0 25.0 23.0 50.0 37.0 46.0 40.0 33.0 35.0 70.0 125.0 153.0 173.0 261.0 239.0 251.0 223.0 198.0
q-bio.OT 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 6.0 7.0 13.0 17.0 11.0 9.0 13.0 10.0 15.0 32.0 30.0 28.0 51.0 26.0 34.0 43.0 66.0
q-bio.PE 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 11.0 66.0 72.0 63.0 95.0 91.0 65.0 97.0 91.0 122.0 260.0 232.0 209.0 187.0 191.0 199.0 164.0 253.0
q-bio.QM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 5.0 11.0 13.0 26.0 40.0 38.0 34.0 26.0 43.0 25.0 60.0 87.0 60.0 75.0 117.0 116.0 108.0 98.0
q-bio.SC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 7.0 8.0 6.0 7.0 11.0 12.0 3.0 4.0 3.0 12.0 13.0 24.0 23.0 21.0 26.0 14.0 9.0
q-bio.TO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 8.0 8.0 8.0 14.0 9.0 6.0 5.0 11.0 9.0 20.0 15.0 37.0 38.0 45.0 62.0 41.0 49.0
q-fin.CP 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 6.0 12.0 14.0 7.0 21.0 22.0 31.0 19.0 41.0 34.0 25.0 28.0
q-fin.EC 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 19.0 55.0 54.0 68.0 11.0 0.0 0.0
q-fin.GN 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 27.0 30.0 54.0 45.0 77.0 33.0 33.0 37.0 24.0 37.0 37.0 64.0
q-fin.MF 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 35.0 63.0 67.0 75.0 74.0 87.0 68.0
q-fin.PM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 10.0 7.0 16.0 17.0 26.0 24.0 12.0 24.0 30.0 25.0 43.0 24.0
q-fin.PR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 35.0 40.0 23.0 33.0 47.0 33.0 28.0 26.0 29.0 23.0 28.0 13.0
q-fin.RM 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 11.0 16.0 20.0 31.0 26.0 23.0 31.0 27.0 38.0 42.0 32.0 37.0
q-fin.ST 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 4.0 28.0 32.0 29.0 28.0 41.0 43.0 36.0 47.0 33.0 37.0 49.0 51.0
q-fin.TR 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 14.0 11.0 13.0 17.0 21.0 25.0 22.0 31.0 20.0 31.0 30.0 26.0
quant-ph 0.0 0.0 0.0 0.0 0.0 0.0 11.0 239.0 369.0 567.0 779.0 1026.0 1226.0 1590.0 1794.0 2045.0 2137.0 2406.0 2429.0 2462.0 2462.0 2638.0 2119.0 2192.0 2167.0 2445.0 2660.0 2755.0 2918.0 3101.0 3177.0 3158.0 3094.0
stat.AP 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 60.0 117.0 99.0 125.0 162.0 161.0 237.0 284.0 284.0 299.0 440.0 549.0 495.0 456.0
stat.CO 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 9.0 16.0 19.0 44.0 38.0 60.0 101.0 110.0 143.0 124.0 188.0 176.0 101.0 104.0
stat.ME 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 100.0 92.0 76.0 119.0 189.0 282.0 410.0 528.0 645.0 715.0 904.0 923.0 783.0 830.0
stat.ML 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 13.0 24.0 42.0 48.0 72.0 59.0 127.0 155.0 243.0 283.0 422.0 92.0 1.0 1.0
stat.OT 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 13.0 8.0 11.0 5.0 22.0 32.0 26.0 41.0 51.0 38.0 33.0

The problem is that some categories disappear once they split into enough subcategories -> look just at the disciplines (encoded before the dot)

In [263]:
arxiv_tmp['categories'].apply(lambda x: x.split('.')[0]).unique()
Out[263]:
array(['hep-ph', 'physics', 'math', 'cond-mat', 'gr-qc', 'astro-ph',
       'hep-th', 'hep-ex', 'nlin', 'nucl-th', 'cs', 'quant-ph', 'q-bio',
       'nucl-ex', 'hep-lat', 'stat', 'q-fin', 'eess', 'econ'],
      dtype=object)
In [265]:
arxiv_tmp = arxiv.query('n_categories == 1')
year_vs_disc = groupby_2d([arxiv_tmp['submitted'].dt.year, arxiv_tmp['categories'].apply(lambda x: x.split('.')[0])], arxiv_tmp)
In [267]:
year_vs_disc
Out[267]:
categories astro-ph cond-mat cs econ eess gr-qc hep-ex hep-lat hep-ph hep-th math nlin nucl-ex nucl-th physics q-bio q-fin quant-ph stat
submitted
1988 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
1989 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 2.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
1990 0.0 0.0 2.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 16.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
1991 0.0 0.0 3.0 0.0 0.0 0.0 0.0 0.0 0.0 286.0 44.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0
1992 36.0 187.0 0.0 0.0 0.0 54.0 0.0 241.0 646.0 1172.0 160.0 0.0 0.0 37.0 0.0 0.0 0.0 0.0 0.0
1993 403.0 596.0 6.0 0.0 0.0 268.0 0.0 267.0 1507.0 1517.0 169.0 0.0 0.0 251.0 0.0 0.0 0.0 0.0 0.0
1994 901.0 1113.0 15.0 0.0 0.0 456.0 53.0 316.0 2062.0 1626.0 254.0 0.0 3.0 304.0 0.0 0.0 0.0 11.0 0.0
1995 1508.0 1489.0 26.0 0.0 0.0 515.0 139.0 311.0 2436.0 1753.0 268.0 0.0 16.0 367.0 0.0 0.0 0.0 239.0 0.0
1996 2201.0 2085.0 29.0 0.0 0.0 567.0 142.0 415.0 2698.0 1948.0 267.0 0.0 39.0 473.0 37.0 0.0 0.0 369.0 0.0
1997 3357.0 2457.0 18.0 0.0 0.0 682.0 283.0 395.0 2893.0 2026.0 339.0 0.0 50.0 596.0 209.0 0.0 0.0 567.0 0.0
1998 4394.0 2951.0 148.0 0.0 0.0 740.0 376.0 435.0 2920.0 2015.0 1191.0 2.0 87.0 713.0 265.0 6.0 0.0 779.0 0.0
1999 5274.0 3398.0 141.0 0.0 0.0 813.0 620.0 416.0 3160.0 2035.0 1310.0 4.0 150.0 736.0 388.0 1.0 0.0 1026.0 0.0
2000 5913.0 3665.0 235.0 0.0 0.0 853.0 655.0 339.0 3075.0 2267.0 1541.0 399.0 153.0 665.0 712.0 1.0 1.0 1226.0 0.0
2001 6315.0 4104.0 294.0 0.0 0.0 824.0 761.0 418.0 3103.0 2186.0 1594.0 401.0 210.0 683.0 704.0 0.0 0.0 1590.0 0.0
2002 6494.0 4582.0 272.0 0.0 0.0 831.0 738.0 405.0 3155.0 2241.0 2063.0 417.0 260.0 775.0 608.0 0.0 0.0 1794.0 0.0
2003 7280.0 5043.0 378.0 0.0 0.0 856.0 715.0 385.0 2926.0 2234.0 2641.0 407.0 271.0 855.0 853.0 68.0 0.0 2045.0 0.0
2004 7565.0 5176.0 418.0 0.0 0.0 964.0 846.0 405.0 3122.0 2220.0 3249.0 423.0 428.0 855.0 1205.0 215.0 0.0 2137.0 0.0
2005 8082.0 5423.0 443.0 0.0 0.0 1048.0 812.0 476.0 2911.0 2096.0 3915.0 435.0 397.0 793.0 1508.0 250.0 0.0 2406.0 0.0
2006 8485.0 5360.0 703.0 0.0 0.0 1075.0 805.0 351.0 2970.0 2095.0 4806.0 511.0 387.0 749.0 1779.0 286.0 0.0 2429.0 0.0
2007 9398.0 5298.0 1192.0 0.0 0.0 1170.0 810.0 408.0 3027.0 2151.0 5581.0 424.0 506.0 843.0 2052.0 327.0 0.0 2462.0 182.0
2008 9323.0 5645.0 1328.0 0.0 0.0 1117.0 867.0 340.0 3042.0 2127.0 6074.0 440.0 485.0 756.0 2173.0 309.0 16.0 2462.0 249.0
2009 7344.0 5248.0 1698.0 0.0 0.0 1167.0 782.0 352.0 2979.0 2063.0 7082.0 415.0 470.0 797.0 2392.0 262.0 131.0 2638.0 236.0
2010 8033.0 6182.0 3193.0 0.0 0.0 887.0 562.0 289.0 2325.0 1567.0 8972.0 290.0 310.0 705.0 2540.0 266.0 148.0 2119.0 349.0
2011 8211.0 6521.0 3358.0 0.0 0.0 766.0 922.0 258.0 2335.0 1429.0 10483.0 322.0 351.0 614.0 2608.0 279.0 169.0 2192.0 469.0
2012 7546.0 5956.0 4311.0 0.0 0.0 810.0 854.0 241.0 2208.0 1423.0 11756.0 302.0 335.0 538.0 2869.0 364.0 178.0 2167.0 573.0
2013 8200.0 7328.0 5936.0 0.0 1.0 984.0 592.0 333.0 2408.0 1557.0 14457.0 341.0 310.0 612.0 3675.0 746.0 259.0 2445.0 880.0
2014 8018.0 7616.0 6667.0 0.0 1.0 1045.0 600.0 263.0 2311.0 1642.0 16292.0 376.0 271.0 584.0 4104.0 733.0 257.0 2660.0 1099.0
2015 8417.0 8319.0 7954.0 0.0 0.0 1174.0 544.0 306.0 2513.0 1677.0 17492.0 366.0 242.0 601.0 4555.0 777.0 311.0 2755.0 1347.0
2016 8285.0 9033.0 10415.0 0.0 0.0 1116.0 490.0 239.0 2450.0 1640.0 18480.0 372.0 219.0 607.0 5318.0 821.0 332.0 2918.0 1447.0
2017 8699.0 9085.0 14571.0 33.0 239.0 1157.0 568.0 285.0 2338.0 1621.0 19978.0 444.0 244.0 625.0 6022.0 823.0 358.0 3101.0 1995.0
2018 9299.0 8947.0 18250.0 203.0 1216.0 1226.0 510.0 226.0 2295.0 1676.0 20817.0 383.0 264.0 595.0 6701.0 864.0 314.0 3177.0 1791.0
2019 8332.0 7770.0 17024.0 224.0 1400.0 1245.0 435.0 167.0 2117.0 1657.0 19211.0 346.0 198.0 553.0 5983.0 762.0 331.0 3158.0 1418.0
2020 6934.0 6812.0 17511.0 264.0 1607.0 1145.0 303.0 93.0 1618.0 1339.0 16632.0 266.0 194.0 459.0 5709.0 862.0 311.0 3094.0 1424.0
In [268]:
year_vs_disc2 = normalize_by_rowsum(year_vs_disc)
In [314]:
with warnings.catch_warnings():
    warnings.simplefilter('ignore')

    ax = year_vs_disc2.plot.area(stacked=True, colormap="nipy_spectral", figsize=(12,6), legend=True);
    year_vs_disc2.rename(columns=dict(zip(year_vs_disc2.columns,["_"+c for c in year_vs_disc2.columns])))\
        .plot.line(stacked=True, color="k", lw=0.75, ax=ax);
    handles, labels = ax.get_legend_handles_labels()
    plt.legend(reversed(handles), reversed(labels), bbox_to_anchor=(1.05, 1))
    plt.xlim([1992,2020])
    plt.ylim([0,1])
    plt.ylabel('% of all submitted papers')
    ax.set_yticklabels([str(round(tick*100)) for tick in ax.get_yticks()])
    plt.xlabel('year')

Note: cond-mat is misleadingly close to cs -> most of the disciplines are anyway related to physics, look for a way to fish out: econ, eess, astro-ph, cs, math, nlin, q-bio, q-fin, stat from the rest -> use colors

disciplines vs multi-categorical papers

In [412]:
arxiv['unique_categories'] = \
    arxiv['categories'].apply(lambda x: list(set([c.split('.')[0] for c in x.split(' ')])))
In [414]:
arxiv['unique_categories'].apply(lambda x: ' '.join(x)).value_counts()
Out[414]:
math                                      315258
astro-ph                                  219695
cond-mat                                  212886
cs                                        176369
physics                                    84304
                                           ...  
eess q-bio nlin                                1
cs math gr-qc stat                             1
astro-ph hep-ph quant-ph nucl-ex gr-qc         1
astro-ph hep-ex hep-ph hep-th nucl-ex          1
cond-mat hep-ph q-fin                          1
Name: unique_categories, Length: 2759, dtype: int64
In [415]:
groupby_2d([arxiv['unique_categories'].apply(lambda x: len(x)), arxiv['n_categories']], arxiv)
Out[415]:
n_categories 1 2 3 4 5 6 7 8 9 10 11 13
unique_categories
1 1025259.0 244231.0 38184.0 4794.0 658.0 24.0 2.0 0.0 0.0 0.0 0.0 0.0
2 0.0 258478.0 75666.0 17790.0 3408.0 386.0 17.0 6.0 0.0 0.0 0.0 0.0
3 0.0 0.0 73952.0 18055.0 5070.0 1052.0 172.0 13.0 1.0 2.0 0.0 0.0
4 0.0 0.0 0.0 20360.0 3650.0 802.0 116.0 22.0 5.0 1.0 1.0 1.0
5 0.0 0.0 0.0 0.0 3239.0 646.0 100.0 23.0 7.0 1.0 1.0 0.0
6 0.0 0.0 0.0 0.0 0.0 494.0 93.0 28.0 6.0 3.0 0.0 0.0
7 0.0 0.0 0.0 0.0 0.0 0.0 41.0 20.0 5.0 5.0 0.0 0.0
8 0.0 0.0 0.0 0.0 0.0 0.0 0.0 9.0 3.0 1.0 0.0 0.0
9 0.0 0.0 0.0 0.0 0.0 0.0 0.0 0.0 3.0 1.0 0.0 0.0
In [416]:
year = 2019
arxiv_tmp = arxiv[arxiv['submitted'].dt.year==year]
groupby_2d([arxiv_tmp['unique_categories'].apply(lambda x: len(x)), arxiv_tmp['n_categories']], arxiv_tmp)
Out[416]:
n_categories 1 2 3 4 5 6 7 8 9
unique_categories
1 72331.0 22837.0 5186.0 712.0 95.0 1.0 0.0 0.0 0.0
2 0.0 27173.0 11375.0 2826.0 553.0 56.0 3.0 0.0 0.0
3 0.0 0.0 6931.0 2673.0 801.0 163.0 18.0 1.0 0.0
4 0.0 0.0 0.0 1389.0 387.0 115.0 17.0 1.0 1.0
5 0.0 0.0 0.0 0.0 206.0 43.0 7.0 0.0 0.0
6 0.0 0.0 0.0 0.0 0.0 15.0 1.0 0.0 0.0
In [417]:
year = 2009
arxiv_tmp = arxiv[arxiv['submitted'].dt.year==year]
groupby_2d([arxiv_tmp['unique_categories'].apply(lambda x: len(x)), arxiv_tmp['n_categories']], arxiv_tmp)
Out[417]:
n_categories 1 2 3 4 5 6 7 8 9 10
unique_categories
1 36056.0 14392.0 817.0 85.0 10.0 5.0 1.0 0.0 0.0 0.0
2 0.0 6467.0 2083.0 371.0 51.0 5.0 0.0 0.0 0.0 0.0
3 0.0 0.0 2109.0 456.0 98.0 11.0 3.0 1.0 0.0 1.0
4 0.0 0.0 0.0 747.0 128.0 25.0 5.0 0.0 1.0 0.0
5 0.0 0.0 0.0 0.0 93.0 26.0 4.0 2.0 2.0 0.0
6 0.0 0.0 0.0 0.0 0.0 11.0 2.0 2.0 0.0 0.0
7 0.0 0.0 0.0 0.0 0.0 0.0 1.0 0.0 0.0 0.0
In [422]:
uniq_disc_vs_year = groupby_2d([arxiv['submitted'].dt.year, arxiv['unique_categories'].apply(lambda x: len(x))], arxiv)
In [423]:
uniq_disc_vs_year2 = normalize_by_rowsum(uniq_disc_vs_year)
In [424]:
uniq_disc_vs_year2.plot.area(stacked=True)
Out[424]:
<AxesSubplot:xlabel='submitted'>

it looks like the majority of the increas in interdisciplinarity comes from bifurcation within a discipline, and not real cross-disciplinary stuff

In [435]:
arxiv_tmp = arxiv[arxiv['unique_categories'].apply(lambda x: len(x))==1].query('n_categories>1')
bifurcating_categories = groupby_2d([arxiv_tmp['submitted'].dt.year, arxiv_tmp['unique_categories'].apply(lambda x: x[0])], arxiv_tmp)
In [437]:
bifurcating_categories.plot.area(stacked=True)
Out[437]:
<AxesSubplot:xlabel='submitted'>
In [439]:
bifurcating_categories.plot.area(subplots=True, figsize=(6,12));
In [432]:
arxiv_tmp = arxiv[arxiv['unique_categories'].apply(lambda x: len(x))>1]
disc_combinations_vs_year = groupby_2d([arxiv_tmp['submitted'].dt.year, arxiv_tmp['unique_categories'].apply(lambda x: ' '.join(x))], arxiv_tmp)
In [443]:
disc_combinations_vs_year.sum().sort_values(ascending=False).head(50)
Out[443]:
unique_categories
cs math                         48886.0
cs stat                         32839.0
math math-ph                    29506.0
hep-th gr-qc                    16511.0
cond-mat quant-ph               16221.0
cs eess                         14329.0
math stat                       13406.0
cond-mat physics                12713.0
hep-ph hep-ex                   11783.0
physics cond-mat                11659.0
astro-ph gr-qc                  11019.0
hep-ph astro-ph                  9659.0
hep-ph nucl-th                   9165.0
physics quant-ph                 8790.0
physics astro-ph                 8205.0
hep-th astro-ph gr-qc            7389.0
cs math stat                     6519.0
hep-th math math-ph              6241.0
hep-th hep-ph                    4720.0
hep-ph hep-th                    4712.0
math math-ph quant-ph            4275.0
hep-th math                      4271.0
cs physics                       4247.0
physics q-bio                    4081.0
physics hep-ex                   3734.0
cond-mat math math-ph            3529.0
cs math eess                     3457.0
hep-ph hep-lat                   3310.0
physics nlin                     3249.0
hep-ph astro-ph gr-qc hep-th     3109.0
physics cs                       3099.0
nucl-ex nucl-th                  3013.0
cond-mat physics quant-ph        2935.0
cond-mat q-bio                   2897.0
math math-ph nlin                2825.0
cond-mat nlin                    2689.0
cond-mat hep-th                  2651.0
cs q-bio                         2512.0
hep-ph nucl-ex nucl-th           2457.0
cs eess stat                     2451.0
cs quant-ph                      2375.0
hep-th cond-mat                  2263.0
hep-ph astro-ph gr-qc            2214.0
physics math                     2179.0
math q-fin                       2167.0
hep-th math gr-qc math-ph        2043.0
hep-ph astro-ph hep-th           1965.0
math q-bio                       1774.0
nucl-ex hep-ex                   1730.0
hep-th quant-ph                  1678.0
dtype: float64

submissions that happen on a particular day of week

In [ ]:
submissions_dow_norm = normalize_by_rowsum( 
    groupby_2d([arxiv['submitted'].dt.year, arxiv['submitted'].dt.dayofweek], arxiv)
)
In [324]:
num_to_dow = {0: "Mon", 1: "Tue", 2: "Wed", 3: "Thu", 4: "Fri", 5: "Sat", 6: "Sun"}
In [325]:
submissions_dow_norm_tmp = submissions_dow_norm.rename(columns=num_to_dow)
print(submissions_dow_norm_tmp.loc[[1994,2020]].T)
axes = submissions_dow_norm_tmp.loc[1992:].plot.area(subplots=True,figsize=(6,12), legend=True);
[ax.legend(bbox_to_anchor=(1.05, 1)) for ax in axes];
submitted      1994      2020
submitted                    
Mon        0.173646  0.183578
Tue        0.193689  0.177590
Wed        0.198750  0.171289
Thu        0.180294  0.170422
Fri        0.180393  0.146289
Sat        0.043362  0.072386
Sun        0.029867  0.078445

Scientists submit on weekends increasingly more than 25 years ago

submissions in 2019, day of week vs discipline (only papers belonging to a single discipline)

In [392]:
def weekday_sub_prop(year, metric="all"):
    arxiv_tmp = arxiv[arxiv['submitted'].dt.year==year].query('n_categories == 1')
    dow_vs_disc = groupby_2d([arxiv_tmp['submitted'].dt.dayofweek, arxiv_tmp['categories'].apply(lambda x: x.split('.')[0])], arxiv_tmp)
    dow_vs_disc = dow_vs_disc.T
    dow_vs_disc['weekend'] = (dow_vs_disc[5]+dow_vs_disc[6])/2
    dow_vs_disc['weekday'] = (dow_vs_disc[[0,1,2,3,4]].sum(axis=1))/5
    dow_vs_disc['total'] = dow_vs_disc[range(7)].sum(axis=1)
    dow_vs_disc['prop'] = dow_vs_disc['weekend']/dow_vs_disc['weekday']
    if metric != "all":
        tmp = dow_vs_disc[metric]
        tmp.name = year
    else: 
        tmp = dow_vs_disc
    return tmp
In [389]:
weekday_sub_prop(2019)
Out[389]:
submitted 0 1 2 3 4 5 6 weekend weekday all prop
categories
astro-ph 1562 1639 1617 1483 1311 360 360 360.0 1522.4 8332 0.236469
cond-mat 1420 1404 1334 1407 1296 401 508 454.5 1372.2 7770 0.331220
cs 2947 3088 2859 2901 2528 1354 1347 1350.5 2864.6 17024 0.471445
econ 33 42 47 33 26 18 25 21.5 36.2 224 0.593923
eess 251 249 237 245 226 92 100 96.0 241.6 1400 0.397351
gr-qc 235 215 204 227 180 78 106 92.0 212.2 1245 0.433553
hep-ex 65 72 57 94 89 28 30 29.0 75.4 435 0.384615
hep-lat 40 30 24 28 30 5 10 7.5 30.4 167 0.246711
hep-ph 437 355 367 384 335 105 134 119.5 375.6 2117 0.318158
hep-th 347 313 288 326 229 64 90 77.0 300.6 1657 0.256154
math 3421 3431 3227 3200 2881 1417 1634 1525.5 3232.0 19211 0.471999
nlin 64 56 67 60 49 28 22 25.0 59.2 346 0.422297
nucl-ex 28 37 44 31 36 12 10 11.0 35.2 198 0.312500
nucl-th 116 73 95 108 83 38 40 39.0 95.0 553 0.410526
physics 998 1151 1083 1019 962 405 365 385.0 1042.6 5983 0.369269
q-bio 142 133 135 126 125 63 38 50.5 132.2 762 0.381997
q-fin 57 67 47 41 49 37 33 35.0 52.2 331 0.670498
quant-ph 566 513 565 578 532 195 209 202.0 550.8 3158 0.366739
stat 240 278 217 230 222 103 128 115.5 237.4 1418 0.486521
In [395]:
weekday_prop_disc_props = pd.DataFrame([weekday_sub_prop(y,'prop') for y in np.arange(1990,2021,1)]).fillna(0)
In [396]:
weekday_prop_disc_props.plot.line(subplots=True, figsize=(6,20));
In [390]:
sunday_disc_props = pd.DataFrame([weekday_sub_prop(y,6) for y in np.arange(1990,2021,1)]).fillna(0)
In [397]:
weekend_disc_props = pd.DataFrame([weekday_sub_prop(y,"weekend")*2 for y in np.arange(1990,2021,1)]).fillna(0)
In [393]:
total_disc_props = pd.DataFrame([weekday_sub_prop(y,"total") for y in np.arange(1990,2021,1)]).fillna(0)
In [394]:
(sunday_disc_props/total_disc_props).plot.line(subplots=True, figsize=(6,20));
In [398]:
(weekend_disc_props/total_disc_props).plot.line(subplots=True, figsize=(6,20));