In [1]:
import numpy as np

# Path to the .npz archive to inspect
path = '/data/hanzhe/20250424cs/ICE_data/example_1_data_ICE_GM.npz'

# np.load on a .npz returns an NpzFile that keeps the archive open and reads
# members on access, so open it in a context manager to release the file
# handle as soon as the inspection is done.
# allow_pickle stays False; only enable it if the archive stores Python
# objects and comes from a trusted source.
with np.load(path, allow_pickle=False) as data:
    # Names of every array stored in the archive
    print("Available arrays:", data.files)

    # Report the shape and dtype of each array in turn
    for name in data.files:
        arr = data[name]
        print(f"Array name: {name}")
        print(f"  Shape: {arr.shape}")
        print(f"  Dtype: {arr.dtype}")
        print("-" * 40)


Available arrays: ['X', 'y']
Array name: X
  Shape: (2000, 100)
  Dtype: float64
----------------------------------------
Array name: y
  Shape: (2000,)
  Dtype: float64
----------------------------------------


In [2]:
import numpy as np
import os

# Input .npz archive
npz_path = '/data/hanzhe/20250424cs/ICE_data/example_1_data_ICE_GM.npz'

# Output directory (change this to wherever the .npy files should go)
out_dir = '/data/hanzhe/20250424cs/ICE_data/ICE_GM'

# Make sure the output directory exists
os.makedirs(out_dir, exist_ok=True)

# Read X and y inside a context manager so the archive's file handle is
# closed once both arrays are in memory. `data` is a closed NpzFile after
# this block; X and y remain valid arrays.
with np.load(npz_path, allow_pickle=False) as data:
    X = data['X']
    y = data['y']

# Write each array to its own .npy file
np.save(os.path.join(out_dir, 'X_ICE_GM.npy'), X)
np.save(os.path.join(out_dir, 'y_ICE_GM.npy'), y)

print(f"Saved X.npy with shape {X.shape} and dtype {X.dtype}")
print(f"Saved y.npy with shape {y.shape} and dtype {y.dtype}")


Saved X.npy with shape (2000, 100) and dtype float64
Saved y.npy with shape (2000,) and dtype float64


In [3]:
import numpy as np
import os

# Input .npz archive
npz_path = '/data/hanzhe/20250424cs/ICE_data/example_1_data_ICE_SG.npz'

# Output directory (change this to wherever the .npy files should go)
out_dir = '/data/hanzhe/20250424cs/ICE_data/ICE_SG'

# Make sure the output directory exists
os.makedirs(out_dir, exist_ok=True)

# Read X and y inside a context manager so the archive's file handle is
# closed once both arrays are in memory. `data` is a closed NpzFile after
# this block; X and y remain valid arrays.
with np.load(npz_path, allow_pickle=False) as data:
    X = data['X']
    y = data['y']

# Write each array to its own .npy file
np.save(os.path.join(out_dir, 'X_ICE_SG.npy'), X)
np.save(os.path.join(out_dir, 'y_ICE_SG.npy'), y)

print(f"Saved X.npy with shape {X.shape} and dtype {X.dtype}")
print(f"Saved y.npy with shape {y.shape} and dtype {y.dtype}")


Saved X.npy with shape (2000, 100) and dtype float64
Saved y.npy with shape (2000,) and dtype float64


In [4]:
import numpy as np
import os

# Input .npz archive
npz_path = '/data/hanzhe/20250424cs/ICE_data/example_1_data_ICE_vMFNM.npz'

# Output directory (change this to wherever the .npy files should go)
out_dir = '/data/hanzhe/20250424cs/ICE_data/ICE_vMFNM'

# Make sure the output directory exists
os.makedirs(out_dir, exist_ok=True)

# Read X and y inside a context manager so the archive's file handle is
# closed once both arrays are in memory. `data` is a closed NpzFile after
# this block; X and y remain valid arrays.
with np.load(npz_path, allow_pickle=False) as data:
    X = data['X']
    y = data['y']

# Write each array to its own .npy file
np.save(os.path.join(out_dir, 'X_ICE_vMFNM.npy'), X)
np.save(os.path.join(out_dir, 'y_ICE_vMFNM.npy'), y)

print(f"Saved X.npy with shape {X.shape} and dtype {X.dtype}")
print(f"Saved y.npy with shape {y.shape} and dtype {y.dtype}")


Saved X.npy with shape (2000, 100) and dtype float64
Saved y.npy with shape (2000,) and dtype float64


In [5]:
#!/usr/bin/env python
# coding: utf-8
"""
Load y_ICE_GM.npy, derive binary labels, and count how many are 0
----------------------------------------
Requires:
  pip install numpy
"""

import os
import numpy as np

# ───────── 1. Load the raw y ─────────
y_path = '/data/hanzhe/20250424cs/ICE_data/ICE_GM/y_ICE_GM.npy'
y = np.load(y_path)   # expected shape: (n_samples,)

# ───────── 2. Sign distribution of the raw values ─────────
positive_mask = y > 0          # reused below for the binarization
total = y.size
num_pos = positive_mask.sum()
num_neg = (y < 0).sum()
num_zero = (y == 0).sum()

print(
    f"Total samples: {total}\n"
    f"  > 0: {num_pos}\n"
    f"  = 0: {num_zero}\n"
    f"  < 0: {num_neg}"
)

# ───────── 3. Binarize ─────────
#    label is 1 where y > 0, otherwise 0
binary_y = positive_mask.astype(int)

# ───────── 4. Class counts after binarization ─────────
num_binary_zero = (binary_y == 0).sum()
num_binary_one = (binary_y == 1).sum()

print(
    "\nAfter binarization (>0→1, ≤0→0):\n"
    f"  zeros (0): {num_binary_zero}\n"
    f"  ones  (1): {num_binary_one}"
)

# (Optional) persist the binary labels next to the raw y file
out_dir = os.path.dirname(y_path)
out_path = os.path.join(out_dir, 'y_ICE_GM_binary.npy')
np.save(out_path, binary_y)
print(f"\nSaved binarized labels to: {out_path}")


Total samples: 2000
  > 0: 2000
  = 0: 0
  < 0: 0

After binarization (>0→1, ≤0→0):
  zeros (0): 0
  ones  (1): 2000

Saved binarized labels to: /data/hanzhe/20250424cs/ICE_data/ICE_GM/y_ICE_GM_binary.npy


In [7]:
#!/usr/bin/env python
# coding: utf-8
"""
Load y_ICE_vMFNM.npy, derive binary labels, and count how many are 0
----------------------------------------
Requires:
  pip install numpy
"""

import os
import numpy as np

# ───────── 1. Load the raw y ─────────
y_path = '/data/hanzhe/20250424cs/ICE_data/ICE_vMFNM/y_ICE_vMFNM.npy'
y = np.load(y_path)   # expected shape: (n_samples,)

# ───────── 2. Sign distribution of the raw values ─────────
total = y.size
num_pos = np.sum(y > 0)
num_neg = np.sum(y < 0)
num_zero = np.sum(y == 0)

print(f"Total samples: {total}")
print(f"  > 0: {num_pos}")
print(f"  = 0: {num_zero}")
print(f"  < 0: {num_neg}")

# ───────── 3. Binarize ─────────
#    new_y = 1 if y > 0, else 0
binary_y = (y > 0).astype(int)

# ───────── 4. Class counts after binarization ─────────
num_binary_zero = np.sum(binary_y == 0)
num_binary_one  = np.sum(binary_y == 1)

print(f"\nAfter binarization (>0→1, ≤0→0):")
print(f"  zeros (0): {num_binary_zero}")
print(f"  ones  (1): {num_binary_one}")

# (Optional) persist the binary labels next to the raw y file.
# The output name is derived from the input file name so it always matches
# the dataset being processed. This cell previously hard-coded
# 'y_ICE_GM_binary.npy', which wrote vMFNM labels under a GM name; a file
# with that name may still exist in this directory from an earlier run.
out_dir = os.path.dirname(y_path)
y_stem = os.path.splitext(os.path.basename(y_path))[0]   # 'y_ICE_vMFNM'
out_path = os.path.join(out_dir, f'{y_stem}_binary.npy')
np.save(out_path, binary_y)
print(f"\nSaved binarized labels to: {out_path}")


Total samples: 2000
  > 0: 845
  = 0: 0
  < 0: 1155

After binarization (>0→1, ≤0→0):
  zeros (0): 1155
  ones  (1): 845

Saved binarized labels to: /data/hanzhe/20250424cs/ICE_data/ICE_vMFNM/y_ICE_GM_binary.npy
