# Overview

## EC-funded publications over time

In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(publicationDate)) AS year,
  COUNT(DISTINCT pub.id) AS total
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
GROUP BY year
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,total
0,2025,290
1,2024,45840
2,2023,95885
3,2022,109419
4,2021,110149
5,2020,97088
6,2019,91064
7,2018,86551
8,2017,76872
9,2016,68297


In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(pubs.publicationDate)) AS year,
  COUNT(DISTINCT pubs.id) AS total
FROM oag_v9_0_1.publications AS pubs,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS projs,
  UNNEST(JSON_QUERY_ARRAY(projs.fundings)) AS funds,
  UNNEST(JSON_QUERY_ARRAY(pubs.instances)) AS instance
WHERE pubs.id = rels.source
  AND rels.target = projs.id
  AND JSON_VALUE(funds.shortName) = 'EC'
  AND JSON_VALUE(instance.refereed) = 'peerReviewed'
GROUP BY year
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,total
0,2025,245
1,2024,42091
2,2023,74611
3,2022,80729
4,2021,83946
5,2020,75548
6,2019,66462
7,2018,64198
8,2017,59533
9,2016,55934


## EC-funded datasets

In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(dts.publicationDate)) AS year,
  COUNT(dts.id) AS total
FROM oag_v9_0_1.datasets AS dts,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS projs,
  UNNEST(JSON_QUERY_ARRAY(projs.fundings)) AS funds
WHERE dts.id = rels.source
  AND rels.target = projs.id
  AND JSON_VALUE(funds.shortName) = 'EC'
GROUP BY year
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,total
0,2025,6
1,2024,10359
2,2023,18102
3,2022,23708
4,2021,24375
5,2020,16587
6,2019,283416
7,2018,18367
8,2017,13122
9,2016,7603


## FOSs

In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(publicationDate)) AS year,
  JSON_VALUE(subject.subject.value) AS fos,
  COUNT(DISTINCT pub.id) AS total
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds,
  UNNEST(JSON_QUERY_ARRAY(pub.subjects)) AS subject
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
  AND JSON_VALUE(subject.subject.scheme) = 'FOS'
  AND REGEXP_CONTAINS(JSON_VALUE(subject.subject.value), r'^\d{2}\s.*')
GROUP BY year, fos
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC, fos ASC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,fos,total
0,2025,01 natural sciences,9
1,2025,02 engineering and technology,2
2,2025,03 medical and health sciences,1
3,2024,01 natural sciences,996
4,2024,02 engineering and technology,426
...,...,...,...
138,2001,05 social sciences,1
139,2000,01 natural sciences,15
140,2000,02 engineering and technology,4
141,2000,03 medical and health sciences,14


In [None]:
%%bigquery

SELECT
  JSON_VALUE(subject.subject.value) AS fos,
  COUNT(DISTINCT pub.id) AS total
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds,
  UNNEST(JSON_QUERY_ARRAY(pub.subjects)) AS subject
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
  AND JSON_VALUE(subject.subject.scheme) = 'FOS'
  AND REGEXP_CONTAINS(JSON_VALUE(subject.subject.value), r'^\d{2}\s.*')
GROUP BY fos
ORDER BY fos ASC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,fos,total
0,01 natural sciences,277188
1,02 engineering and technology,208819
2,03 medical and health sciences,257865
3,04 agricultural and veterinary sciences,10418
4,05 social sciences,47175
5,06 humanities and the arts,8127


## SDGs

In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(publicationDate)) AS year,
  JSON_VALUE(subject.subject.value) AS sdg,
  COUNT(DISTINCT pub.id) AS total
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds,
  UNNEST(JSON_QUERY_ARRAY(pub.subjects)) AS subject
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
  AND JSON_VALUE(subject.subject.scheme) = 'SDG'
GROUP BY year, sdg
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC, sdg ASC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,sdg,total
0,2025,13. Climate action,2
1,2025,7. Clean energy,1
2,2024,1. No poverty,9
3,2024,10. No inequality,8
4,2024,11. Sustainability,92
...,...,...,...
312,2001,3. Good health,1
313,2001,7. Clean energy,1
314,2000,13. Climate action,1
315,2000,14. Life underwater,1


In [None]:
%%bigquery

SELECT
  JSON_VALUE(subject.subject.value) AS sdg,
  COUNT(DISTINCT pub.id) AS total
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds,
  UNNEST(JSON_QUERY_ARRAY(pub.subjects)) AS subject
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
  AND JSON_VALUE(subject.subject.scheme) = 'SDG'
GROUP BY sdg
ORDER BY sdg ASC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,sdg,total
0,1. No poverty,3155
1,10. No inequality,2278
2,11. Sustainability,9910
3,12. Responsible consumption,6452
4,13. Climate action,21371
5,14. Life underwater,6061
6,15. Life on land,8980
7,16. Peace & justice,5908
8,2. Zero hunger,7249
9,3. Good health,25448


## OA statuses of EC-funded publications


In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(publicationDate)) as year,
      JSON_VALUE(bestAccessRight.label) AS OA_status,
      COUNT(pub.id) AS n_papers
FROM oag_v9_0_1.publications AS pub,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds
WHERE pub.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
GROUP BY year, OA_status
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,OA_status,n_papers
0,2025,RESTRICTED,1
1,2025,,49
2,2025,CLOSED,43
3,2025,OPEN,220
4,2024,CLOSED,4010
...,...,...,...
96,2006,CLOSED,30
97,2005,RESTRICTED,4
98,2005,,8
99,2005,OPEN,89


## OA statuses of EC-funded dataets

In [None]:
%%bigquery

SELECT EXTRACT(YEAR FROM DATE(publicationDate)) as year,
      JSON_VALUE(bestAccessRight.label) AS OA_status,
      COUNT(dts.id) AS n_papers
FROM oag_v9_0_1.datasets AS dts,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS funds
WHERE dts.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
GROUP BY year, OA_status
HAVING year BETWEEN 2005 AND 2025
ORDER BY year DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,year,OA_status,n_papers
0,2025,,1
1,2025,OPEN,5
2,2024,CLOSED,8
3,2024,,7912
4,2024,OPEN,2420
...,...,...,...
66,2007,,21
67,2006,OPEN,11
68,2006,,5
69,2005,,8


## Collaboration between organizations funded by the EC

See if many organization are collaborating in consortium


In [None]:
%%bigquery

SELECT
      COUNT(orgs.id) AS n_orgs, rels.target
FROM oag_v9_0_1.organizations AS orgs,
  oag_v9_0_1.relations AS rels,
  oag_v9_0_1.projects AS proj,
  UNNEST(JSON_QUERY_ARRAY(proj.fundings)) AS ç
WHERE orgs.id = rels.source
  AND rels.target = proj.id
  AND JSON_VALUE(funds.shortName) = 'EC'
GROUP BY rels.target


Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,n_orgs,target
0,27,corda__h2020::e82a72df850d6da20338328aad84c7a9
1,25,corda_____he::0af87e4d62317b62836f35bd7ff3acbc
2,20,corda__h2020::3a422b596a0a2c1e1c465e52be98c4bb
3,44,corda__h2020::1a5ff37d09cd9ab3a666c6c162d19eaf
4,33,corda__h2020::fa7128b8a5c76161880818a479a8a83a
...,...,...
110513,18,corda__h2020::74925949ef993a519be90219971a7f67
110514,18,corda_____he::a3a98bff2b0667bb7c6059856dbcd3e6
110515,18,corda_______::59d54c273ea6743c705e245c8687e5dc
110516,18,corda_____he::c7055d02109db5bba4b41c410da6fc65


In [16]:
%%bigquery

WITH organization_project AS (
  SELECT
    rel.source AS org_id,
    org.legalName AS org_name,
    rel.target AS project_id
  FROM oag_v9_0_1.relations AS rel,
    oag_v9_0_1.projects AS proj,
    oag_v9_0_1.organizations AS org,
    UNNEST(JSON_QUERY_ARRAY(fundings)) AS funding
  WHERE JSON_VALUE(funding, '$.shortName') = 'EC' AND
        rel.relationName = 'isParticipant' AND
        rel.target = proj.id AND
        rel.source = org.id
)

SELECT l.org_id AS left_org,
        l.org_name AS left_name,
        r.org_id AS right_org,
        r.org_name AS right_name,
        COUNT(DISTINCT l.project_id) AS count
FROM organization_project AS l
      JOIN
        organization_project AS r
      ON l.project_id = r.project_id AND
        l.org_id < r.org_id
GROUP BY l.org_id, r.org_id, l.org_name, r.org_name
ORDER BY count DESC

Query is running:   0%|          |

Downloading:   0%|          |

Unnamed: 0,left_org,left_name,right_org,right_name,count
0,openorgs____::4dee7ea0d1fd1b48c199ee744e21dc13,Helmholtz Association of German Research Centres,openorgs____::cb92d2ed6f9a724e1c181a734c59f713,Forschungszentrum Jülich,561
1,openorgs____::76681f01bcfcc1ff3405bed86eea99b2,Fraunhofer Society,pending_org_::ec98a602fa61f571dfe03106a1ade993,COMMISSARIAT A L ENERGIE ATOMIQUE ET AUX ENERG...,360
2,openorgs____::4dee7ea0d1fd1b48c199ee744e21dc13,Helmholtz Association of German Research Centres,openorgs____::7fbdf9cd4423c4604745a16afe728bc7,French National Centre for Scientific Research,353
3,openorgs____::7fbdf9cd4423c4604745a16afe728bc7,French National Centre for Scientific Research,pending_org_::ec98a602fa61f571dfe03106a1ade993,COMMISSARIAT A L ENERGIE ATOMIQUE ET AUX ENERG...,343
4,openorgs____::7fbdf9cd4423c4604745a16afe728bc7,French National Centre for Scientific Research,openorgs____::d41cf6bd4ab1b1362a44397e0b95c975,National Research Council,327
...,...,...,...,...,...
2327326,openorgs____::e470685843188cc3e8006d032f02b36c,Asociación de Investigación de la Industria Te...,pending_org_::939cbdc96365d4e06e805d13d0e5ef92,SERVICIUL DE PROTECTIE SI PAZA,1
2327327,pending_org_::0253607ffa35a07f0cfac48b80b2e8c7,SAP AG,pending_org_::844e35d680937f2467242ab64815809f,SOIDEMER S.L.,1
2327328,openorgs____::91a4a28a7ecc2a5a8a1449ee989b1a7e,Forschungszentrum Telekommunikation Wien,pending_org_::a313c04a0b0c20e21bb5225080b2ddb2,OPTIBASE LTD,1
2327329,openorgs____::28bf88ea47bc4867eb58c8981271a6e0,Dortmund University of Applied Sciences and Arts,pending_org_::a7b3b0086fed0a97d5a417f8b3b63a7e,DAIKIN EUROPE N.V.,1
