/
passoptnew.py
129 lines (68 loc) · 1.86 KB
/
passoptnew.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
import pandas as pd
import numpy as np
import math
from astropy import units as u
from astropy.coordinates import SkyCoord
from joblib import Parallel, delayed
import multiprocessing
def filereader(filename):
    """Load a CSV file into a pandas DataFrame.

    Args:
        filename: Path (or file-like object) handed straight to
            ``pandas.read_csv`` with default options.

    Returns:
        The DataFrame produced by ``pandas.read_csv``.
    """
    return pd.read_csv(filename)
def pass1(i, j, frame=None, max_sep_arcsec=1):
    """Report whether rows ``i`` and ``j`` are closer than a given angle.

    The separation is the arccosine of the dot product of the two rows'
    ``X``/``Y``/``Z`` values, converted to arcseconds. This only yields a
    true angle if each row is a unit vector -- presumably the case for the
    input catalogue; TODO confirm.

    Args:
        i: Label of the first row.
        j: Label of the second row.
        frame: Table with ``X``, ``Y`` and ``Z`` columns, accessed as
            ``frame['X'][i]``. Defaults to the module-level ``df``.
        max_sep_arcsec: Separation in arcseconds below which the pair is
            reported. Defaults to 1.

    Returns:
        The tuple ``(i, j)`` when the separation is strictly below
        ``max_sep_arcsec``, otherwise ``None``.
    """
    data = df if frame is None else frame

    # Per-pair trace kept from the original; this form prints the same text
    # on Python 2 and Python 3.
    print("%s %s" % (i, j))

    dot = (data['X'][i] * data['X'][j]
           + data['Y'][i] * data['Y'][j]
           + data['Z'][i] * data['Z'][j])

    # Rounding can push the dot product slightly outside [-1, 1], where
    # math.acos raises ValueError, so clamp both ends. Explicit comparisons
    # (rather than min/max) let a NaN pass through untouched, which then
    # yields a NaN angle and a None result instead of a false match.
    if dot > 1:
        dot = 1
    elif dot < -1:
        dot = -1

    angle = math.acos(dot)
    arcsec = angle * ((180 / math.pi) * 3600)

    if arcsec < max_sep_arcsec:
        return (i, j)
    return None
def filewriter(data_f2, data_f3,
               nonduplicate_path='~/Data/NonDuplicate2GG.csv',
               duplicate_path='~/Data/Duplicate2GG.csv'):
    """Write the two result tables to comma-separated files.

    Args:
        data_f2: Table written to ``nonduplicate_path`` via its ``to_csv``
            method.
        data_f3: Table written to ``duplicate_path`` via its ``to_csv``
            method.
        nonduplicate_path: Destination for ``data_f2``. Defaults to the
            path the script has always used.
        duplicate_path: Destination for ``data_f3``. Defaults to the path
            the script has always used.

    Returns:
        None. Existing files at either path are overwritten.
    """
    data_f2.to_csv(nonduplicate_path, sep=',')
    data_f3.to_csv(duplicate_path, sep=',')
def data_split(arr, frame=None):
    """Split a table into rows not flagged in ``arr`` and rows flagged in it.

    Args:
        arr: Iterable of index labels identifying the flagged (duplicate)
            rows.
        frame: Table to split. Defaults to the module-level ``df``.

    Returns:
        A tuple ``(non_duplicates, duplicates)``: the table without the
        rows labelled in ``arr``, and the table restricted to those rows.
        Both keep the original row order.

    Raises:
        KeyError: If ``arr`` contains a label that is not in the table's
            index (raised by ``drop``).
    """
    data = df if frame is None else frame
    flagged = list(arr)

    non_duplicates = data.drop(flagged)

    # A single vectorised membership mask replaces the per-row
    # ``i not in arr`` scan, which was quadratic and assumed the index
    # labels were exactly 0..len(df)-1.
    duplicates = data[data.index.isin(flagged)]

    return (non_duplicates, duplicates)
def duplicate_indices(pair_results):
    """Collapse per-pair results into a sorted array of unique row indices.

    Args:
        pair_results: Iterable whose items are either ``None`` (no match)
            or an ``(i, j)`` tuple of matching row indices.

    Returns:
        A 1-D integer NumPy array holding every index that appears in at
        least one tuple, sorted and without repeats. Empty when there are
        no matches.
    """
    # Filter None explicitly instead of relying on np.unique sorting it to
    # position 0: that breaks when no None is present, and a mixed
    # None/tuple list cannot be sorted on Python 3.
    flat = [idx for pair in pair_results if pair is not None for idx in pair]
    return np.unique(np.asarray(flat, dtype=int))


if __name__ == "__main__":
    import itertools

    filename = '~/Data/OPTDATA.csv'
    # Module-level assignment: pass1 and data_split read ``df`` as a global.
    # NOTE(review): worker processes only see ``df`` if they inherit this
    # module's state (fork-style start); confirm before running on a
    # platform that spawns fresh interpreters.
    df = filereader(filename)
    num_cores = multiprocessing.cpu_count()

    # Every unordered pair of row positions (i < j), in the same order the
    # original nested loops produced.
    row_pairs = itertools.combinations(range(len(df)), 2)
    pair_results = Parallel(n_jobs=num_cores, backend="multiprocessing")(
        delayed(pass1)(i, j) for i, j in row_pairs
    )

    results_i = duplicate_indices(pair_results)
    data_frame2, data_frame3 = data_split(results_i)
    filewriter(data_frame2, data_frame3)