In [1]:
import datasets
import pandas as pd

In [2]:
# Load the SwaRD dataset from its on-disk directory.
# The path is relative, so it resolves against the notebook's working directory.
SwaRD = datasets.load_from_disk("../../datasets_with_data/SwaRD/")

In [3]:
# Columns shown in the preview table below.
sub_columns = [
    "REQID_expanded",
    "Project Name",
    "Requirement Sentences",
    "isReqSysAuxContAux",
]

# Convert to pandas and keep only the columns listed above.
# Drop the trailing `[sub_columns]` selection to keep every column instead.
SwaRD_df = SwaRD.to_pandas()[sub_columns]

In [4]:
# Draw a reproducible preview of up to 10 requirements per label.
#
# The groups are iterated explicitly instead of using `groupby(...).apply(...)`:
# pandas 2.2 deprecated `apply` operating on the grouping column, and newer
# versions exclude that column from the frames handed to the function, which
# would silently drop `isReqSysAuxContAux` from the table. Iterating keeps the
# column, the group order (sorted labels) and the per-group seed unchanged.
per_label_samples = [
    # same seed for every label; never request more rows than the label has
    label_rows.sample(n = min(10, len(label_rows)), random_state = 100)
    for _, label_rows in SwaRD_df.groupby("isReqSysAuxContAux")
]
sampled_rows = (
    pd.concat(per_label_samples)
    if per_label_samples
    else SwaRD_df.iloc[0:0]  # pd.concat raises on an empty list; keep an empty frame
)

# `sampled` is a pandas Styler (not a DataFrame): the sampled rows plus the CSS
# used to render them as a compact, left-aligned HTML table.
sampled = (
    sampled_rows
    .style
    .hide(axis = "index")
    # general styling for all data cells
    .set_properties(**{
        "text-align": "left",
        "direction": "ltr",
        "font-size": "12px",
        "line-height": "1.2",
        "padding": "4px",
        "vertical-align": "top"
    })
    .set_table_styles([
        # NOTE(review): Styler appears to scope each selector under the table's
        # own id, so "table" would only match a nested <table> and these three
        # rules may never apply. Confirm whether the empty selector "" (the
        # table itself) was intended; left unchanged to keep the rendering as is.
        {"selector": "table", "props": [
            ("table-layout", "fixed"),
            ("width", "100%"),
            ("border-collapse", "collapse")
        ]},
        # header cells
        {"selector": "th", "props": [
            ("text-align", "left"),
            ("direction", "ltr"),
            ("font-size", "12px"),
            ("padding", "4px")
        ]}
    ])
    # wrap long text in the two free-text columns, each capped at its own width
    .set_properties(
        subset = ['Requirement Sentences'],
        **{
            "white-space": "normal",
            "word-break": "break-word",
            "max-width": "450px"
        }
    )
    .set_properties(
        subset = ['Project Name'],
        **{
            "white-space": "normal",
            "word-break": "break-word",
            "max-width": "200px"
        }
    )
)


In [5]:
# Last expression of the cell: shows the styled sample table as the cell output.
sampled

REQID_expanded,Project Name,Requirement Sentences,isReqSysAuxContAux
38560,A Dataset of Crowdsourced Smarthome Requirements with Creativity Ratings,It is the middle of the afternoon on a bright day.,contextual_auxiliary
36735,A Dataset of Crowdsourced Smarthome Requirements with Creativity Ratings,"However, it was just Daylights Saving Time so all the clocks changed by an hour.",contextual_auxiliary
19348,IlmSeven,We should not support them for projects being built with 3.,contextual_auxiliary
24717,IlmSeven,How do we tell which jobs failed and which didn't?,contextual_auxiliary
37648,A Dataset of Crowdsourced Smarthome Requirements with Creativity Ratings,A owl catches a mouse on top of my driveway.,contextual_auxiliary
7210,IlmSeven,It would be nice if there was a place to put complex queries.,contextual_auxiliary
21655,IlmSeven,The original idea of toolchains was to have the same tool being used by different plugins within the same project.,contextual_auxiliary
36837,A Dataset of Crowdsourced Smarthome Requirements with Creativity Ratings,I get out of bed and walk toward the door.,contextual_auxiliary
7216,IlmSeven,"In Derby, a statement which times out when executed with Statement.",contextual_auxiliary
36400,A Dataset of Crowdsourced Smarthome Requirements with Creativity Ratings,I get to the driveway of my house and stand there for a bit talking on the phone.,contextual_auxiliary
