# **Step#1 Data Collection From FAST-NU Website**

## Necessary Libraries

In [1]:
import pandas as pd
import requests
from bs4 import BeautifulSoup

## FAST School of Computing Faculty Data

In [2]:
URL = "https://lhr.nu.edu.pk/faculty/#fsc"
page = requests.get(URL)
print(page)

<Response [200]>


In [3]:
soup = BeautifulSoup(page.content, "html.parser")
soup.find("div", class_="container", id="fsc")

<div class="container" id="fsc">
<br>
<h1 class="mb-2 mt-3">FAST School of Computing Faculty</h1>
<hr class="mt-0 nu-hr mb-0"/>
<div class="container tab-pane active" id="faculty-tab"><br/>
<div class="row">
<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/01._Dr_Kashif_Zafar_Prof._CS.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Kashif Zafar</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">kashif.zafar@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 569</p> -->
<a class="faculty-link" href="/fsc/facultyProfile/1238"></a>
</div>
</div>
</div>
<div class="col-lg-3 col-md-4 col-sm-6 col-12

In [4]:
divs = soup.find(class_="container", id="fsc").find_all(
    class_="col-lg-3 col-md-4 col-sm-6 col-12"
)

## Data Frame Preparation

In [5]:
joint_data = pd.DataFrame()

data_list = []

for div in divs:
    faculty_link = div.find("a", class_="faculty-link")
    href = faculty_link["href"] if faculty_link else None

    new_data = {
        "ID": href.split("/")[-1] if href else None,
        "Name": (
            div.find("h5", class_="text-center").text.strip()
            if div.find("h5", class_="text-center")
            else None
        ),
        "Designation": (
            div.find("p", class_="small text-center font-italic")
            .get_text(separator=" ", strip=True)
            .split("HEC Approved")[0]
            .strip()
            if div.find("p", class_="small text-center font-italic")
            else None
        ),
        "HEC Approved PHD Supervisor": (
            "HEC Approved"
            in div.find("p", class_="small text-center font-italic").get_text(
                separator=" ", strip=True
            )
            if div.find("p", class_="small text-center font-italic")
            else False
        ),
        "Email": (
            div.find("p", class_="mb-0 text-center").text.strip()
            if div.find("p", class_="mb-0 text-center")
            else None
        ),
        "Department": href.split("/")[1] if href else None,
        "ImageURL": (
            div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            ).get("src")
            if div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            )
            else None
        ),
    }

    data_list.append(new_data)

joint_data = pd.DataFrame(data_list)
joint_data.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,1238,Dr. Kashif Zafar,Professor & HOD,True,kashif.zafar@nu.edu.pk,fsc,/media/Faculty/01._Dr_Kashif_Zafar_Prof._CS.JPG
1,4027,Dr. Aamir Wali,Professor,True,aamir.wali@nu.edu.pk,fsc,/media/Faculty/51._Dr_Aamir_Wali_Prof._AIDS.JPG
2,4391,Dr. Asif Mahmood Gillani,Professor,True,asif.gilani@nu.edu.pk,fsc,/media/Faculty/02._Dr_Asif_Mehmood_Gilani_Prof...
3,6113,Dr. Asma Naseer,Professor,True,asma.naseer@nu.edu.pk,fsc,/media/Faculty/07._Dr_Asma_Naseer_Assoc._Prof....
4,4329,Dr. Zareen Alamgir,Professor,True,zareen.alamgir@nu.edu.pk,fsc,/media/Faculty/03._Dr_Zareen_Alamgir_Prof._CS.JPG


## Data import to .csv file

In [6]:
joint_data.to_csv("fsc.csv")

## Department of Electrical Engineering Faculty Data

In [7]:
URL = "https://lhr.nu.edu.pk/faculty/#ee"
page = requests.get(URL)
print(page)

<Response [200]>


In [8]:
soup = BeautifulSoup(page.content, "html.parser")
soup.find("div", class_="container", id="ee")

<div class="container" id="ee">
<br/>
<h1 class="mb-2 mt-3">Department of Electrical Engineering Faculty</h1>
<hr class="mt-0 nu-hr mb-0"/>
<div class="container tab-pane active" id="faculty-tab"><br/>
<div class="row">
<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/98._Dr_Saima_Zafar_Prof._EE.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Saima Zafar</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">saima.zafar@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 265</p> -->
<a class="faculty-link" href="/ee/facultyProfile/4198"></a>
</div>
</div>
</div>
<div class="col-lg-3 col-md-4 col-sm-

In [9]:
divs = soup.find(class_="container", id="ee").find_all(
    class_="col-lg-3 col-md-4 col-sm-6 col-12"
)
print(divs)

[<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/98._Dr_Saima_Zafar_Prof._EE.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Saima Zafar</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">saima.zafar@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 265</p> -->
<a class="faculty-link" href="/ee/facultyProfile/4198"></a>
</div>
</div>
</div>, <div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/99._Dr_S_M_Sajid_Prof._EE.JPG"/>
</di

## Data Frame Preparation

In [10]:
joint_data = pd.DataFrame()

data_list = []

for div in divs:
    faculty_link = div.find("a", class_="faculty-link")
    href = faculty_link["href"] if faculty_link else None

    new_data = {
        "ID": href.split("/")[-1] if href else None,
        "Name": (
            div.find("h5", class_="text-center").text.strip()
            if div.find("h5", class_="text-center")
            else None
        ),
        "Designation": (
            div.find("p", class_="small text-center font-italic")
            .get_text(separator=" ", strip=True)
            .split("HEC Approved")[0]
            .strip()
            if div.find("p", class_="small text-center font-italic")
            else None
        ),
        "HEC Approved PHD Supervisor": (
            "HEC Approved"
            in div.find("p", class_="small text-center font-italic").get_text(
                separator=" ", strip=True
            )
            if div.find("p", class_="small text-center font-italic")
            else False
        ),
        "Email": (
            div.find("p", class_="mb-0 text-center").text.strip()
            if div.find("p", class_="mb-0 text-center")
            else None
        ),
        "Department": href.split("/")[1] if href else None,
        "ImageURL": (
            div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            ).get("src")
            if div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            )
            else None
        ),
    }

    data_list.append(new_data)

joint_data = pd.DataFrame(data_list)
joint_data.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,4198,Dr. Saima Zafar,Professor & HOD,True,saima.zafar@nu.edu.pk,ee,/media/Faculty/98._Dr_Saima_Zafar_Prof._EE.JPG
1,4108,Dr. S.M. Sajid,Professor,True,sm.sajid@nu.edu.pk,ee,/media/Faculty/99._Dr_S_M_Sajid_Prof._EE.JPG
2,5421,Dr. Syed Aun Abbas,Professor,False,aun.abbas@nu.edu.pk,ee,/media/Faculty/100._Dr_Syed_Aun_Abbas_Prof._EE...
3,4609,Dr. Omer Saleem,Associate Professor,True,omer.saleem@nu.edu.pk,ee,/media/Faculty/101._Dr_Omer_Saleem_Associate_P...
4,6942,Dr. Huzaifa Rauf,Assistant Professor,False,huzaifa.rauf@nu.edu.pk,ee,/media/Faculty/Dr._Huzaifa_Rauf-removebg-previ...


## Data import to .csv file

In [11]:
joint_data.to_csv("ee.csv")

## Department of Civil Engineering

In [12]:
URL = "https://lhr.nu.edu.pk/faculty/#cv"
page = requests.get(URL)
print(page)

<Response [200]>


In [13]:
soup = BeautifulSoup(page.content, "html.parser")
soup.find("div", class_="container", id="cv")

<div class="container" id="cv">
<br/>
<h1 class="mb-2 mt-3">Department of Civil Engineering Faculty</h1>
<hr class="mt-0 nu-hr mb-0"/>
<div class="container tab-pane active" id="faculty-tab"><br/>
<div class="row">
<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/77._Dr_Tauqir_Ahmed_Prof._CvL.jpg"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Tauqir Ahmed</h5>
<p class="small text-center font-italic">Associate Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">tauqir.ahmed@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 417</p> -->
<a class="faculty-link" href="/cv/facultyProfile/5818"></a>
</div>
</div>
</div>
<div class="col-lg-3 col-md-

In [14]:
divs = soup.find(class_="container", id="cv").find_all(
    class_="col-lg-3 col-md-4 col-sm-6 col-12"
)
print(divs)

[<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/77._Dr_Tauqir_Ahmed_Prof._CvL.jpg"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Tauqir Ahmed</h5>
<p class="small text-center font-italic">Associate Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">tauqir.ahmed@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 417</p> -->
<a class="faculty-link" href="/cv/facultyProfile/5818"></a>
</div>
</div>
</div>, <div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/78._Dr_Shahid_Ali_Prof.

## Data Frame Preparation

In [15]:
joint_data = pd.DataFrame()

data_list = []

for div in divs:
    faculty_link = div.find("a", class_="faculty-link")
    href = faculty_link["href"] if faculty_link else None

    new_data = {
        "ID": href.split("/")[-1] if href else None,
        "Name": (
            div.find("h5", class_="text-center").text.strip()
            if div.find("h5", class_="text-center")
            else None
        ),
        "Designation": (
            div.find("p", class_="small text-center font-italic")
            .get_text(separator=" ", strip=True)
            .split("HEC Approved")[0]
            .strip()
            if div.find("p", class_="small text-center font-italic")
            else None
        ),
        "HEC Approved PHD Supervisor": (
            "HEC Approved"
            in div.find("p", class_="small text-center font-italic").get_text(
                separator=" ", strip=True
            )
            if div.find("p", class_="small text-center font-italic")
            else False
        ),
        "Email": (
            div.find("p", class_="mb-0 text-center").text.strip()
            if div.find("p", class_="mb-0 text-center")
            else None
        ),
        "Department": href.split("/")[1] if href else None,
        "ImageURL": (
            div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            ).get("src")
            if div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            )
            else None
        ),
    }

    data_list.append(new_data)

joint_data = pd.DataFrame(data_list)
joint_data.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,5818,Dr. Tauqir Ahmed,Associate Professor & HOD,True,tauqir.ahmed@nu.edu.pk,cv,/media/Faculty/77._Dr_Tauqir_Ahmed_Prof._CvL.jpg
1,9451,Dr. Shahid Ali,Professor,True,shahid.ali@nu.edu.pk,cv,/media/Faculty/78._Dr_Shahid_Ali_Prof._CvL.JPG
2,5705,Dr. Syed Ali Rizwan Bukhari,Professor,True,syed.ali@nu.edu.pk,cv,/media/Faculty/79._Dr_Syed_Ali_Rizwan_Prof._Cv...
3,6941,Dr. Muhammad Azam,Assistant Professor,False,muhammad.azam@nu.edu.pk,cv,/media/Faculty/Dr._Muhammad_Azam-removebg-prev...
4,6047,Dr. Muhammad Umar,Assistant Professor,True,m.umar@nu.edu.pk,cv,/media/Faculty/80._Dr_Muhammad_Umar_Asst._Prof...


## Data import to .csv file

In [16]:
joint_data.to_csv("cv.csv")

## Fast School of Management

In [17]:
URL = "https://lhr.nu.edu.pk/faculty/#fsm"
page = requests.get(URL)
print(page)

<Response [200]>


In [18]:
soup = BeautifulSoup(page.content, "html.parser")
soup.find("div", class_="container", id="fsm")

<div class="container" id="fsm">
<br/>
<h1 class="mb-2 mt-3">FAST School of Management Faculty</h1>
<hr class="mt-0 nu-hr mb-0"/>
<div class="container tab-pane active" id="faculty-tab"><br/>
<div class="row">
<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/121._Dr_Hamid_Hassan_Prof_MG.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Hamid Hassan</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">hamid.hassan@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 252</p> -->
<a class="faculty-link" href="/fsm/facultyProfile/3924"></a>
</div>
</div>
</div>
<div class="col-lg-3 col-md-4 col-sm-6 col-

In [19]:
divs = soup.find(class_="container", id="fsm").find_all(
    class_="col-lg-3 col-md-4 col-sm-6 col-12"
)
print(divs)

[<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/121._Dr_Hamid_Hassan_Prof_MG.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Hamid Hassan</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">hamid.hassan@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 252</p> -->
<a class="faculty-link" href="/fsm/facultyProfile/3924"></a>
</div>
</div>
</div>, <div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/122.Dr_Akbar_Azam_Assoc._Prof._MG

## Data Frame Preparation

In [20]:
joint_data = pd.DataFrame()

data_list = []

for div in divs:
    faculty_link = div.find("a", class_="faculty-link")
    href = faculty_link["href"] if faculty_link else None

    new_data = {
        "ID": href.split("/")[-1] if href else None,
        "Name": (
            div.find("h5", class_="text-center").text.strip()
            if div.find("h5", class_="text-center")
            else None
        ),
        "Designation": (
            div.find("p", class_="small text-center font-italic")
            .get_text(separator=" ", strip=True)
            .split("HEC Approved")[0]
            .strip()
            if div.find("p", class_="small text-center font-italic")
            else None
        ),
        "HEC Approved PHD Supervisor": (
            "HEC Approved"
            in div.find("p", class_="small text-center font-italic").get_text(
                separator=" ", strip=True
            )
            if div.find("p", class_="small text-center font-italic")
            else False
        ),
        "Email": (
            div.find("p", class_="mb-0 text-center").text.strip()
            if div.find("p", class_="mb-0 text-center")
            else None
        ),
        "Department": href.split("/")[1] if href else None,
        "ImageURL": (
            div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            ).get("src")
            if div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            )
            else None
        ),
    }

    data_list.append(new_data)

joint_data = pd.DataFrame(data_list)
joint_data.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,3924,Dr. Hamid Hassan,Professor & HOD,True,hamid.hassan@nu.edu.pk,fsm,/media/Faculty/121._Dr_Hamid_Hassan_Prof_MG.JPG
1,4685,Dr. Akbar Azam,Associate Professor,True,akbar.azam@nu.edu.pk,fsm,/media/Faculty/122.Dr_Akbar_Azam_Assoc._Prof._...
2,6563,Dr. Amna Farrukh,Assistant Professor On Leave,False,amna.farrukh@nu.edu.pk,fsm,/media/Faculty/126._Amna_Farrukh_Assit_Prof._M...
3,5712,Dr. Brig Mujahid Hussain,Assistant Professor,True,mujahid.hussain@nu.edu.pk,fsm,/media/Faculty/128._Dr_Mujahid_Hussain_Asst._P...
4,4629,Dr. Fatima Omer,Assistant Professor,False,fatima.omer@nu.edu.pk,fsm,/media/Faculty/125._Dr_Fatima_Omer_Asst._Prof....


## Data import to .csv file

In [21]:
joint_data.to_csv("fsm.csv")

## Department of Science and Humanities

In [22]:
URL = "https://lhr.nu.edu.pk/faculty/#ss"
page = requests.get(URL)
print(page)

<Response [200]>


In [23]:
soup = BeautifulSoup(page.content, "html.parser")
soup.find("div", class_="container", id="ss")

<div class="container" id="ss">
<br/>
<h1 class="mb-2 mt-3">Department of Science &amp; Humanities Faculty</h1>
<hr class="mt-0 nu-hr mb-0"/>
<div class="container tab-pane active" id="faculty-tab"><br/>
<div class="row">
<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/149._Dr_Mubashir_Qayyum_Prof._SH.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Mubashir Qayyum</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">mubashir.qayyum@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 283</p> -->
<a class="faculty-link" href="/ss/facultyProfile/4332"></a>
</div>
</div>
</div>
<div class="col-lg-3 c

In [24]:
divs = soup.find(class_="container", id="ss").find_all(
    class_="col-lg-3 col-md-4 col-sm-6 col-12"
)
print(divs)

[<div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/149._Dr_Mubashir_Qayyum_Prof._SH.JPG"/>
</div>
<div class="card-body pr-0 pl-0 pb-0">
<h5 class="text-center">Dr. Mubashir Qayyum</h5>
<p class="small text-center font-italic">Professor &amp; HOD
                        
                         <br> HEC Approved PhD Supervisor 
                        
                        </br></p>
<p class="mb-0 text-center">mubashir.qayyum@nu.edu.pk</p>
<!--  <p class="mt-0 small text-center">ext no: 283</p> -->
<a class="faculty-link" href="/ss/facultyProfile/4332"></a>
</div>
</div>
</div>, <div class="col-lg-3 col-md-4 col-sm-6 col-12">
<div class="card facultyCard card-br-0 ml-0 mr-0 pb-0">
<div class="facultyImage">
<img class="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto" src="/media/Faculty/150._Dr._Akhlaq_Ahmad_Bh

## Data Frame Preparation

In [25]:
joint_data = pd.DataFrame()

data_list = []

for div in divs:
    faculty_link = div.find("a", class_="faculty-link")
    href = faculty_link["href"] if faculty_link else None

    new_data = {
        "ID": href.split("/")[-1] if href else None,
        "Name": (
            div.find("h5", class_="text-center").text.strip()
            if div.find("h5", class_="text-center")
            else None
        ),
        "Designation": (
            div.find("p", class_="small text-center font-italic")
            .get_text(separator=" ", strip=True)
            .split("HEC Approved")[0]
            .strip()
            if div.find("p", class_="small text-center font-italic")
            else None
        ),
        "HEC Approved PHD Supervisor": (
            "HEC Approved"
            in div.find("p", class_="small text-center font-italic").get_text(
                separator=" ", strip=True
            )
            if div.find("p", class_="small text-center font-italic")
            else False
        ),
        "Email": (
            div.find("p", class_="mb-0 text-center").text.strip()
            if div.find("p", class_="mb-0 text-center")
            else None
        ),
        "Department": href.split("/")[1] if href else None,
        "ImageURL": (
            div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            ).get("src")
            if div.find(
                "img", class_="card-img-top rounded-circle mt-3 mb-0 d-block mx-auto"
            )
            else None
        ),
    }

    data_list.append(new_data)

joint_data = pd.DataFrame(data_list)
joint_data.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,4332,Dr. Mubashir Qayyum,Professor & HOD,True,mubashir.qayyum@nu.edu.pk,ss,/media/Faculty/149._Dr_Mubashir_Qayyum_Prof._S...
1,4020,Dr. Akhlaq Ahmad Bhatti,Professor Dean (Faculty of Sciences & Humanities),True,akhlaq.ahmad@nu.edu.pk,ss,/media/Faculty/150._Dr._Akhlaq_Ahmad_Bhatti_Pr...
2,3712,Dr. Mazhar Hussain,Professor,True,mazhar.hussain@nu.edu.pk,ss,/media/Faculty/151._Dr_Mazhar_Hussain_Prof._SH...
3,4250,Dr. Saman Shahid,Professor,True,saman.shahid@nu.edu.pk,ss,/media/Faculty/152._Dr._Saman_Shahid_Prof._SH.jpg
4,4018,Dr. Summaira Sarfraz,Professor,True,sumaira.sarfraz@nu.edu.pk,ss,/media/Faculty/148._Dr_Summaira_Sarfraz_Prof._...


## Data import to .csv file

In [26]:
joint_data.to_csv("ss.csv")

# **Step#2 Iterator & Data Frame Creation**




## FAST School of Computing Faculty Data

In [27]:
fsc_file = pd.read_csv("fsc.csv")
fsc_new_data_frame = pd.DataFrame(fsc_file)
fsc_new_data_frame.head()

Unnamed: 0.1,Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,0,1238,Dr. Kashif Zafar,Professor & HOD,True,kashif.zafar@nu.edu.pk,fsc,/media/Faculty/01._Dr_Kashif_Zafar_Prof._CS.JPG
1,1,4027,Dr. Aamir Wali,Professor,True,aamir.wali@nu.edu.pk,fsc,/media/Faculty/51._Dr_Aamir_Wali_Prof._AIDS.JPG
2,2,4391,Dr. Asif Mahmood Gillani,Professor,True,asif.gilani@nu.edu.pk,fsc,/media/Faculty/02._Dr_Asif_Mehmood_Gilani_Prof...
3,3,6113,Dr. Asma Naseer,Professor,True,asma.naseer@nu.edu.pk,fsc,/media/Faculty/07._Dr_Asma_Naseer_Assoc._Prof....
4,4,4329,Dr. Zareen Alamgir,Professor,True,zareen.alamgir@nu.edu.pk,fsc,/media/Faculty/03._Dr_Zareen_Alamgir_Prof._CS.JPG


In [28]:
ID_List = fsc_new_data_frame["ID"].tolist()
print(ID_List)

ID_data_frame = pd.DataFrame(columns=["ID", "Extension", "Highest Education"])
ID_data_frame.head()

[1238, 4027, 4391, 6113, 4329, 6968, 9113, 6174, 9540, 5181, 4261, 6048, 5116, 6811, 4236, 6418, 4335, 6667, 4677, 6562, 9539, 6273, 5114, 6302, 6255, 5466, 5424, 3720, 5054, 4234, 4015, 4507, 4239, 5103, 5221, 5115, 4232, 5230, 6172, 6311, 6379, 6924, 6305, 6723, 6553, 6788, 6274, 6308, 6307, 6551, 6419, 6820, 6588, 6277, 6253, 6549, 6560, 6295, 6415, 6114, 6554, 5967, 6552, 6268, 6773, 5986, 6171, 6719, 6925, 6309, 6559, 6722, 6927, 6662, 6928, 6791, 6838, 6422, 6929, 6767, 6718, 6568, 6663, 6943, 6772, 6770, 6176, 6771, 6558]


Unnamed: 0,ID,Extension,Highest Education


## New data Frame

In [29]:
data_list = []

for ID in ID_List:
    URL = f"http://lhr.nu.edu.pk/fsc/facultyProfile/{ID}"
    page = requests.get(URL)
    soup = BeautifulSoup(page.content, "html.parser")

    # Extracting Extension
    extension = "N/A"
    phone_ext = soup.find("span", class_="small")
    if phone_ext and "Ext:" in phone_ext.text:
        extension = phone_ext.text.split("Ext:")[1].strip()

    # Extracting Education (highest degree)
    latest_education = "N/A"
    education_section = soup.find(
        "div", class_="col-lg-8 col-md-6 col-sm-12 text-justify"
    )
    if education_section:
        ul_tag = education_section.find("ul")
        if ul_tag:
            li_tags = ul_tag.find_all("li")
            if li_tags:
                latest_education = li_tags[0].text.strip()

    new_data = {"ID": ID, "Extension": extension, "Highest Education": latest_education}

    data_list.append(new_data)

In [30]:
ID_data_frame = pd.DataFrame(data_list)
ID_data_frame.head()

Unnamed: 0,ID,Extension,Highest Education
0,1238,569,"PhD (CS), NUCES, Islamabad (2010)"
1,4027,572,"PhD (CS), NUCES, Lahore (2019)"
2,4391,558,"Ph.D(Computing), University of Patras , Greece..."
3,6113,634,"PhD (CS), NUCES, Lahore (2018)"
4,4329,612,"Ph.D (CS), NUCES, Lahore (2014)"


## Import to .csv file

In [31]:
ID_data_frame.to_csv("fsc_2.csv")

## Electrical Engineering Faculty Data

In [32]:
ee_file = pd.read_csv("ee.csv")
ee_new_data_frame = pd.DataFrame(ee_file)
ee_new_data_frame.head()

Unnamed: 0.1,Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,0,4198,Dr. Saima Zafar,Professor & HOD,True,saima.zafar@nu.edu.pk,ee,/media/Faculty/98._Dr_Saima_Zafar_Prof._EE.JPG
1,1,4108,Dr. S.M. Sajid,Professor,True,sm.sajid@nu.edu.pk,ee,/media/Faculty/99._Dr_S_M_Sajid_Prof._EE.JPG
2,2,5421,Dr. Syed Aun Abbas,Professor,False,aun.abbas@nu.edu.pk,ee,/media/Faculty/100._Dr_Syed_Aun_Abbas_Prof._EE...
3,3,4609,Dr. Omer Saleem,Associate Professor,True,omer.saleem@nu.edu.pk,ee,/media/Faculty/101._Dr_Omer_Saleem_Associate_P...
4,4,6942,Dr. Huzaifa Rauf,Assistant Professor,False,huzaifa.rauf@nu.edu.pk,ee,/media/Faculty/Dr._Huzaifa_Rauf-removebg-previ...


In [33]:
ID_List = ee_new_data_frame["ID"].tolist()
print(ID_List)

ID_data_frame = pd.DataFrame(columns=["ID", "Extension", "Highest Education"])
ID_data_frame.head()

[4198, 4108, 5421, 4609, 6942, 9452, 4023, 4233, 3669, 3461, 4484, 3778, 7025, 6289, 3779, 5218, 4809, 6843, 5231, 6557, 7005, 6665, 6830, 7002]


Unnamed: 0,ID,Extension,Highest Education


## New data Frame

In [34]:
data_list = []

for ID in ID_List:
    URL = f"http://lhr.nu.edu.pk/ee/facultyProfile/{ID}"
    page = requests.get(URL)
    soup = BeautifulSoup(page.content, "html.parser")

    # Extracting Extension
    extension = "N/A"
    phone_ext = soup.find("span", class_="small")
    if phone_ext and "Ext:" in phone_ext.text:
        extension = phone_ext.text.split("Ext:")[1].strip()

    # Extracting Education (highest degree)
    latest_education = "N/A"
    education_section = soup.find(
        "div", class_="col-lg-8 col-md-6 col-sm-12 text-justify"
    )
    if education_section:
        ul_tag = education_section.find("ul")
        if ul_tag:
            li_tags = ul_tag.find_all("li")
            if li_tags:
                latest_education = li_tags[0].text.strip()

    new_data = {"ID": ID, "Extension": extension, "Highest Education": latest_education}

    data_list.append(new_data)

In [35]:
ID_data_frame = pd.DataFrame(data_list)
ID_data_frame.head()

Unnamed: 0,ID,Extension,Highest Education
0,4198,265,"PhD (Electrical Engineering), UET, Lahore (2011)"
1,4108,315,"PhD (Electrical Engineering), Graz University ..."
2,5421,254,"PhD (Electrical Engineering),Carleton Universi..."
3,4609,364,"PhD (Electrical Engineering), UET, Lahore (2021)"
4,6942,235,"PhD (EE), LUMS, Lahore (2024)"


## Import to .csv file

In [36]:
ID_data_frame.to_csv("ee_2.csv")

## Civil Engineering Faculty Data

In [37]:
cv_file = pd.read_csv("cv.csv")
cv_new_data_frame = pd.DataFrame(cv_file)
cv_new_data_frame.head()

Unnamed: 0.1,Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,0,5818,Dr. Tauqir Ahmed,Associate Professor & HOD,True,tauqir.ahmed@nu.edu.pk,cv,/media/Faculty/77._Dr_Tauqir_Ahmed_Prof._CvL.jpg
1,1,9451,Dr. Shahid Ali,Professor,True,shahid.ali@nu.edu.pk,cv,/media/Faculty/78._Dr_Shahid_Ali_Prof._CvL.JPG
2,2,5705,Dr. Syed Ali Rizwan Bukhari,Professor,True,syed.ali@nu.edu.pk,cv,/media/Faculty/79._Dr_Syed_Ali_Rizwan_Prof._Cv...
3,3,6941,Dr. Muhammad Azam,Assistant Professor,False,muhammad.azam@nu.edu.pk,cv,/media/Faculty/Dr._Muhammad_Azam-removebg-prev...
4,4,6047,Dr. Muhammad Umar,Assistant Professor,True,m.umar@nu.edu.pk,cv,/media/Faculty/80._Dr_Muhammad_Umar_Asst._Prof...


In [38]:
ID_List = cv_new_data_frame["ID"].tolist()
print(ID_List)

ID_data_frame = pd.DataFrame(columns=["ID", "Extension", "Highest Education"])
ID_data_frame.head()

[5818, 9451, 5705, 6941, 6047, 9513, 4592, 5360, 6041, 4300, 6839, 5553, 6573, 6817, 7026, 6818, 6816, 6569, 6934, 6769, 6571, 6933]


Unnamed: 0,ID,Extension,Highest Education


## New data Frame

In [39]:
data_list = []

for ID in ID_List:
    URL = f"http://lhr.nu.edu.pk/cv/facultyProfile/{ID}"
    page = requests.get(URL)
    soup = BeautifulSoup(page.content, "html.parser")

    # Extracting Extension
    extension = "N/A"
    phone_ext = soup.find("span", class_="small")
    if phone_ext and "Ext:" in phone_ext.text:
        extension = phone_ext.text.split("Ext:")[1].strip()

    # Extracting Education (highest degree)
    latest_education = "N/A"
    education_section = soup.find(
        "div", class_="col-lg-8 col-md-6 col-sm-12 text-justify"
    )
    if education_section:
        ul_tag = education_section.find("ul")
        if ul_tag:
            li_tags = ul_tag.find_all("li")
            if li_tags:
                latest_education = li_tags[0].text.strip()

    new_data = {"ID": ID, "Extension": extension, "Highest Education": latest_education}

    data_list.append(new_data)

In [40]:
ID_data_frame = pd.DataFrame(data_list)
ID_data_frame.head()

Unnamed: 0,ID,Extension,Highest Education
0,5818,417,"PhD (Civil Engineering), The University of Tok..."
1,9451,339,"PhD (Hydraulics), Delft University of Technolo..."
2,5705,228,Post-Doctorate (High Early Strength Self-Compa...
3,6941,414,"PhD (Civil Engineering), Universiti Teknologi,..."
4,6047,450,"PhD (Civil Engineering), University of Tokyo, ..."


## Import to .csv file

In [41]:
ID_data_frame.to_csv("cv_2.csv")

## FAST School of Management Faculty Data

In [42]:
fsm_file = pd.read_csv("fsm.csv")
fsm_new_data_frame = pd.DataFrame(fsm_file)
fsm_new_data_frame.head()

Unnamed: 0.1,Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,0,3924,Dr. Hamid Hassan,Professor & HOD,True,hamid.hassan@nu.edu.pk,fsm,/media/Faculty/121._Dr_Hamid_Hassan_Prof_MG.JPG
1,1,4685,Dr. Akbar Azam,Associate Professor,True,akbar.azam@nu.edu.pk,fsm,/media/Faculty/122.Dr_Akbar_Azam_Assoc._Prof._...
2,2,6563,Dr. Amna Farrukh,Assistant Professor On Leave,False,amna.farrukh@nu.edu.pk,fsm,/media/Faculty/126._Amna_Farrukh_Assit_Prof._M...
3,3,5712,Dr. Brig Mujahid Hussain,Assistant Professor,True,mujahid.hussain@nu.edu.pk,fsm,/media/Faculty/128._Dr_Mujahid_Hussain_Asst._P...
4,4,4629,Dr. Fatima Omer,Assistant Professor,False,fatima.omer@nu.edu.pk,fsm,/media/Faculty/125._Dr_Fatima_Omer_Asst._Prof....


In [43]:
ID_List = fsm_new_data_frame["ID"].tolist()
print(ID_List)

ID_data_frame = pd.DataFrame(columns=["ID", "Extension", "Highest Education"])
ID_data_frame.head()

[3924, 4685, 6563, 5712, 4629, 6561, 5423, 5559, 5427, 6426, 9495, 4483, 4647, 5517, 5227, 6930, 5518, 6115, 6709, 6565, 6664, 6812, 6566, 5713, 6813, 6303, 6931, 7016, 7017, 6789, 7015, 6964, 6790, 6815, 6932]


Unnamed: 0,ID,Extension,Highest Education


## New data Frame

In [44]:
data_list = []

for ID in ID_List:
    URL = f"http://lhr.nu.edu.pk/fsm/facultyProfile/{ID}"
    page = requests.get(URL)
    soup = BeautifulSoup(page.content, "html.parser")

    # Extracting Extension
    extension = "N/A"
    phone_ext = soup.find("span", class_="small")
    if phone_ext and "Ext:" in phone_ext.text:
        extension = phone_ext.text.split("Ext:")[1].strip()

    # Extracting Education (highest degree)
    latest_education = "N/A"
    education_section = soup.find(
        "div", class_="col-lg-8 col-md-6 col-sm-12 text-justify"
    )
    if education_section:
        ul_tag = education_section.find("ul")
        if ul_tag:
            li_tags = ul_tag.find_all("li")
            if li_tags:
                latest_education = li_tags[0].text.strip()

    new_data = {"ID": ID, "Extension": extension, "Highest Education": latest_education}

    data_list.append(new_data)

In [45]:
ID_data_frame = pd.DataFrame(data_list)
ID_data_frame.head()

Unnamed: 0,ID,Extension,Highest Education
0,3924,252,"PhD (HRM/Finance), University of Tsukuba, Japa..."
1,4685,343,"PhD (General Management), University of Bologn..."
2,6563,405,"PhD (Engineering Management), Massey Universit..."
3,5712,255,"PhD (Management Science), NUCES, Lahore (2018)"
4,4629,295,"PhD (Management Science), NUCES, Lahore , Paki..."


## Import to .csv file

In [46]:
ID_data_frame.to_csv("fsm_2.csv")

## Department of Science and Humanities Faculty Data

In [47]:
ss_file = pd.read_csv("ss.csv")
ss_new_data_frame = pd.DataFrame(ss_file)
ss_new_data_frame.head()

Unnamed: 0.1,Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL
0,0,4332,Dr. Mubashir Qayyum,Professor & HOD,True,mubashir.qayyum@nu.edu.pk,ss,/media/Faculty/149._Dr_Mubashir_Qayyum_Prof._S...
1,1,4020,Dr. Akhlaq Ahmad Bhatti,Professor Dean (Faculty of Sciences & Humanities),True,akhlaq.ahmad@nu.edu.pk,ss,/media/Faculty/150._Dr._Akhlaq_Ahmad_Bhatti_Pr...
2,2,3712,Dr. Mazhar Hussain,Professor,True,mazhar.hussain@nu.edu.pk,ss,/media/Faculty/151._Dr_Mazhar_Hussain_Prof._SH...
3,3,4250,Dr. Saman Shahid,Professor,True,saman.shahid@nu.edu.pk,ss,/media/Faculty/152._Dr._Saman_Shahid_Prof._SH.jpg
4,4,4018,Dr. Summaira Sarfraz,Professor,True,sumaira.sarfraz@nu.edu.pk,ss,/media/Faculty/148._Dr_Summaira_Sarfraz_Prof._...


In [48]:
ID_List = ss_new_data_frame["ID"].tolist()
print(ID_List)

ID_data_frame = pd.DataFrame(columns=["ID", "Extension", "Highest Education"])
ID_data_frame.head()

[4332, 4020, 3712, 4250, 4018, 4584, 1250, 4608, 9172, 6768, 5437, 6926, 9173, 4243, 4244, 4245, 5438, 5622, 6555, 5203, 4397, 6421, 6365, 6178, 6420, 5795, 6548, 5337, 6363, 6567]


Unnamed: 0,ID,Extension,Highest Education


## New data Frame

In [49]:
data_list = []

for ID in ID_List:
    URL = f"http://lhr.nu.edu.pk/ss/facultyProfile/{ID}"
    page = requests.get(URL)
    soup = BeautifulSoup(page.content, "html.parser")

    # Extracting Extension
    extension = "N/A"
    phone_ext = soup.find("span", class_="small")
    if phone_ext and "Ext:" in phone_ext.text:
        extension = phone_ext.text.split("Ext:")[1].strip()

    # Extracting Education (highest degree)
    latest_education = "N/A"
    education_section = soup.find(
        "div", class_="col-lg-8 col-md-6 col-sm-12 text-justify"
    )
    if education_section:
        ul_tag = education_section.find("ul")
        if ul_tag:
            li_tags = ul_tag.find_all("li")
            if li_tags:
                latest_education = li_tags[0].text.strip()

    new_data = {"ID": ID, "Extension": extension, "Highest Education": latest_education}

    data_list.append(new_data)

In [50]:
ID_data_frame = pd.DataFrame(data_list)
ID_data_frame.head()

Unnamed: 0,ID,Extension,Highest Education
0,4332,283,"PhD (Applied Mathematics), NUCES, Peshawar (2018)"
1,4020,284,"PhD (Mathematics/ Hypergraph Theory), GCU Laho..."
2,3712,313,"PhD (Mathematics), QAU, Islamabad (2008)"
3,4250,206,"PhD (Environmental Science), PU, Lahore (2015)"
4,4018,227,"PhD (English), AJ&K University, Pakistan (2013)"


## Import to .csv file

In [51]:
ID_data_frame.to_csv("ss_2.csv")

# **Step#3 Data Integration**




## FAST School of Computing

In [52]:
fsc_temp = pd.read_csv("fsc.csv")
fsc_2_temp = pd.read_csv("fsc_2.csv")

merged_df_fsc = pd.merge(fsc_temp, fsc_2_temp, on="ID", how="left")
merged_df_fsc = merged_df_fsc.drop(columns=["Unnamed: 0_x", "Unnamed: 0_y"])

merged_df_fsc.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,1238,Dr. Kashif Zafar,Professor & HOD,True,kashif.zafar@nu.edu.pk,fsc,/media/Faculty/01._Dr_Kashif_Zafar_Prof._CS.JPG,569.0,"PhD (CS), NUCES, Islamabad (2010)"
1,4027,Dr. Aamir Wali,Professor,True,aamir.wali@nu.edu.pk,fsc,/media/Faculty/51._Dr_Aamir_Wali_Prof._AIDS.JPG,572.0,"PhD (CS), NUCES, Lahore (2019)"
2,4391,Dr. Asif Mahmood Gillani,Professor,True,asif.gilani@nu.edu.pk,fsc,/media/Faculty/02._Dr_Asif_Mehmood_Gilani_Prof...,558.0,"Ph.D(Computing), University of Patras , Greece..."
3,6113,Dr. Asma Naseer,Professor,True,asma.naseer@nu.edu.pk,fsc,/media/Faculty/07._Dr_Asma_Naseer_Assoc._Prof....,634.0,"PhD (CS), NUCES, Lahore (2018)"
4,4329,Dr. Zareen Alamgir,Professor,True,zareen.alamgir@nu.edu.pk,fsc,/media/Faculty/03._Dr_Zareen_Alamgir_Prof._CS.JPG,612.0,"Ph.D (CS), NUCES, Lahore (2014)"


## Department of Electrical Engineering

In [53]:
ee_temp = pd.read_csv("ee.csv")
ee_2_temp = pd.read_csv("ee_2.csv")

merged_df_ee = pd.merge(ee_temp, ee_2_temp, on="ID", how="left")
merged_df_ee = merged_df_ee.drop(columns=["Unnamed: 0_x", "Unnamed: 0_y"])

merged_df_ee.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,4198,Dr. Saima Zafar,Professor & HOD,True,saima.zafar@nu.edu.pk,ee,/media/Faculty/98._Dr_Saima_Zafar_Prof._EE.JPG,265.0,"PhD (Electrical Engineering), UET, Lahore (2011)"
1,4108,Dr. S.M. Sajid,Professor,True,sm.sajid@nu.edu.pk,ee,/media/Faculty/99._Dr_S_M_Sajid_Prof._EE.JPG,315.0,"PhD (Electrical Engineering), Graz University ..."
2,5421,Dr. Syed Aun Abbas,Professor,False,aun.abbas@nu.edu.pk,ee,/media/Faculty/100._Dr_Syed_Aun_Abbas_Prof._EE...,254.0,"PhD (Electrical Engineering),Carleton Universi..."
3,4609,Dr. Omer Saleem,Associate Professor,True,omer.saleem@nu.edu.pk,ee,/media/Faculty/101._Dr_Omer_Saleem_Associate_P...,364.0,"PhD (Electrical Engineering), UET, Lahore (2021)"
4,6942,Dr. Huzaifa Rauf,Assistant Professor,False,huzaifa.rauf@nu.edu.pk,ee,/media/Faculty/Dr._Huzaifa_Rauf-removebg-previ...,235.0,"PhD (EE), LUMS, Lahore (2024)"


## Department of Civil Engineering

In [54]:
cv_temp = pd.read_csv("cv.csv")
cv_2_temp = pd.read_csv("cv_2.csv")

merged_df_cv = pd.merge(cv_temp, cv_2_temp, on="ID", how="left")
merged_df_cv = merged_df_cv.drop(columns=["Unnamed: 0_x", "Unnamed: 0_y"])

merged_df_cv.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,5818,Dr. Tauqir Ahmed,Associate Professor & HOD,True,tauqir.ahmed@nu.edu.pk,cv,/media/Faculty/77._Dr_Tauqir_Ahmed_Prof._CvL.jpg,417.0,"PhD (Civil Engineering), The University of Tok..."
1,9451,Dr. Shahid Ali,Professor,True,shahid.ali@nu.edu.pk,cv,/media/Faculty/78._Dr_Shahid_Ali_Prof._CvL.JPG,339.0,"PhD (Hydraulics), Delft University of Technolo..."
2,5705,Dr. Syed Ali Rizwan Bukhari,Professor,True,syed.ali@nu.edu.pk,cv,/media/Faculty/79._Dr_Syed_Ali_Rizwan_Prof._Cv...,228.0,Post-Doctorate (High Early Strength Self-Compa...
3,6941,Dr. Muhammad Azam,Assistant Professor,False,muhammad.azam@nu.edu.pk,cv,/media/Faculty/Dr._Muhammad_Azam-removebg-prev...,414.0,"PhD (Civil Engineering), Universiti Teknologi,..."
4,6047,Dr. Muhammad Umar,Assistant Professor,True,m.umar@nu.edu.pk,cv,/media/Faculty/80._Dr_Muhammad_Umar_Asst._Prof...,450.0,"PhD (Civil Engineering), University of Tokyo, ..."


## FAST School of Management

In [55]:
fsm_temp = pd.read_csv("fsm.csv")
fsm_2_temp = pd.read_csv("fsm_2.csv")

merged_df_fsm = pd.merge(fsm_temp, fsm_2_temp, on="ID", how="left")
merged_df_fsm = merged_df_fsm.drop(columns=["Unnamed: 0_x", "Unnamed: 0_y"])

merged_df_fsm.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,3924,Dr. Hamid Hassan,Professor & HOD,True,hamid.hassan@nu.edu.pk,fsm,/media/Faculty/121._Dr_Hamid_Hassan_Prof_MG.JPG,252.0,"PhD (HRM/Finance), University of Tsukuba, Japa..."
1,4685,Dr. Akbar Azam,Associate Professor,True,akbar.azam@nu.edu.pk,fsm,/media/Faculty/122.Dr_Akbar_Azam_Assoc._Prof._...,343.0,"PhD (General Management), University of Bologn..."
2,6563,Dr. Amna Farrukh,Assistant Professor On Leave,False,amna.farrukh@nu.edu.pk,fsm,/media/Faculty/126._Amna_Farrukh_Assit_Prof._M...,405.0,"PhD (Engineering Management), Massey Universit..."
3,5712,Dr. Brig Mujahid Hussain,Assistant Professor,True,mujahid.hussain@nu.edu.pk,fsm,/media/Faculty/128._Dr_Mujahid_Hussain_Asst._P...,255.0,"PhD (Management Science), NUCES, Lahore (2018)"
4,4629,Dr. Fatima Omer,Assistant Professor,False,fatima.omer@nu.edu.pk,fsm,/media/Faculty/125._Dr_Fatima_Omer_Asst._Prof....,295.0,"PhD (Management Science), NUCES, Lahore , Paki..."


## Department of Science and Humanities

In [56]:
ss_temp = pd.read_csv("ss.csv")
ss_2_temp = pd.read_csv("ss_2.csv")

merged_df_ss = pd.merge(ss_temp, ss_2_temp, on="ID", how="left")
merged_df_ss = merged_df_ss.drop(columns=["Unnamed: 0_x", "Unnamed: 0_y"])

merged_df_ss.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,4332,Dr. Mubashir Qayyum,Professor & HOD,True,mubashir.qayyum@nu.edu.pk,ss,/media/Faculty/149._Dr_Mubashir_Qayyum_Prof._S...,283.0,"PhD (Applied Mathematics), NUCES, Peshawar (2018)"
1,4020,Dr. Akhlaq Ahmad Bhatti,Professor Dean (Faculty of Sciences & Humanities),True,akhlaq.ahmad@nu.edu.pk,ss,/media/Faculty/150._Dr._Akhlaq_Ahmad_Bhatti_Pr...,284.0,"PhD (Mathematics/ Hypergraph Theory), GCU Laho..."
2,3712,Dr. Mazhar Hussain,Professor,True,mazhar.hussain@nu.edu.pk,ss,/media/Faculty/151._Dr_Mazhar_Hussain_Prof._SH...,313.0,"PhD (Mathematics), QAU, Islamabad (2008)"
3,4250,Dr. Saman Shahid,Professor,True,saman.shahid@nu.edu.pk,ss,/media/Faculty/152._Dr._Saman_Shahid_Prof._SH.jpg,206.0,"PhD (Environmental Science), PU, Lahore (2015)"
4,4018,Dr. Summaira Sarfraz,Professor,True,sumaira.sarfraz@nu.edu.pk,ss,/media/Faculty/148._Dr_Summaira_Sarfraz_Prof._...,227.0,"PhD (English), AJ&K University, Pakistan (2013)"


## Final Data File

In [57]:
# Concatenation of all the merged DataFrames
final_df = pd.concat(
    [merged_df_fsc, merged_df_ee, merged_df_cv, merged_df_fsm, merged_df_ss],
    ignore_index=True,
)
final_df.to_csv("fast_lhr_faculty.csv", index=False)

final_df.head()

Unnamed: 0,ID,Name,Designation,HEC Approved PHD Supervisor,Email,Department,ImageURL,Extension,Highest Education
0,1238,Dr. Kashif Zafar,Professor & HOD,True,kashif.zafar@nu.edu.pk,fsc,/media/Faculty/01._Dr_Kashif_Zafar_Prof._CS.JPG,569.0,"PhD (CS), NUCES, Islamabad (2010)"
1,4027,Dr. Aamir Wali,Professor,True,aamir.wali@nu.edu.pk,fsc,/media/Faculty/51._Dr_Aamir_Wali_Prof._AIDS.JPG,572.0,"PhD (CS), NUCES, Lahore (2019)"
2,4391,Dr. Asif Mahmood Gillani,Professor,True,asif.gilani@nu.edu.pk,fsc,/media/Faculty/02._Dr_Asif_Mehmood_Gilani_Prof...,558.0,"Ph.D(Computing), University of Patras , Greece..."
3,6113,Dr. Asma Naseer,Professor,True,asma.naseer@nu.edu.pk,fsc,/media/Faculty/07._Dr_Asma_Naseer_Assoc._Prof....,634.0,"PhD (CS), NUCES, Lahore (2018)"
4,4329,Dr. Zareen Alamgir,Professor,True,zareen.alamgir@nu.edu.pk,fsc,/media/Faculty/03._Dr_Zareen_Alamgir_Prof._CS.JPG,612.0,"Ph.D (CS), NUCES, Lahore (2014)"
