-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgroupcat.py
165 lines (119 loc) · 5.52 KB
/
groupcat.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
""" Modifeld groupcat.py file from Illustris Simulation: Public Data Release.
groupcat.py: File I/O related to the FoF and Subfind group catalogs.
Because I changed some of directory names and file locations. I leave the
offset file in the group directory is the main thing.
"""
import six
import os
import numpy as np
import h5py
def gcPath(basePath, snapNum, chunkNum=0):
""" Return absolute path to a group catalog HDF5 file (modify as needed). """
if snapNum < 10:
snapstr='00'+str(snapNum)
elif snapNum < 100:
snapstr='0'+str(snapNum)
else:
snapstr=str(snapNum)
gcPath = basePath + '/groups_{}/'.format(snapstr)
filePath1 = gcPath + 'groups_{}.{}.hdf5'.format(snapstr, chunkNum)
filePath2 = gcPath + 'fof_subhalo_tab_{}.{}.hdf5'.format(snapstr, chunkNum)
if os.path.isfile(filePath1):
return filePath1
return filePath2
def offsetPath(basePath, snapNum):
""" Return absolute path to a separate offset file (modify as needed). """
offsetPath = basePath + '/groups_%03d/offsets_%03d.hdf5' % snapNum
return offsetPath
def loadObjects(basePath, snapNum, gName, nName, fields):
""" Load either halo or subhalo information from the group catalog. """
result = {}
# make sure fields is not a single element
if isinstance(fields, six.string_types):
fields = [fields]
# load header from first chunk
with h5py.File(gcPath(basePath, snapNum), 'r') as f:
header = dict(f['Header'].attrs.items())
result['count'] = f['Header'].attrs['N' + nName + '_Total']
if not result['count']:
print('warning: zero groups, empty return (snap=' + str(snapNum) + ').')
return result
# if fields not specified, load everything
if not fields:
fields = list(f[gName].keys())
for field in fields:
# verify existence
if field not in f[gName].keys():
raise Exception("Group catalog does not have requested field [" + field + "]!")
# replace local length with global
shape = list(f[gName][field].shape)
shape[0] = result['count']
# allocate within return dict
result[field] = np.zeros(shape, dtype=f[gName][field].dtype)
# loop over chunks
wOffset = 0
for i in range(header['NumFiles']):
f = h5py.File(gcPath(basePath, snapNum, i), 'r')
if not f['Header'].attrs['N'+nName+'_ThisFile']:
continue # empty file chunk
# loop over each requested field
for field in fields:
if field not in f[gName].keys():
raise Exception("Group catalog does not have requested field [" + field + "]!")
# shape and type
shape = f[gName][field].shape
# read data local to the current file
if len(shape) == 1:
result[field][wOffset:wOffset+shape[0]] = f[gName][field][0:shape[0]]
else:
result[field][wOffset:wOffset+shape[0], :] = f[gName][field][0:shape[0], :]
wOffset += shape[0]
f.close()
# only a single field? then return the array instead of a single item dict
if len(fields) == 1:
return result[fields[0]]
return result
def loadSubhalos(basePath, snapNum, fields=None):
""" Load all subhalo information from the entire group catalog for one snapshot
(optionally restrict to a subset given by fields). """
return loadObjects(basePath, snapNum, "Subhalo", "subgroups", fields)
def loadHalos(basePath, snapNum, fields=None):
""" Load all halo information from the entire group catalog for one snapshot
(optionally restrict to a subset given by fields). """
return loadObjects(basePath, snapNum, "Group", "groups", fields)
def loadHeader(basePath, snapNum):
""" Load the group catalog header. """
with h5py.File(gcPath(basePath, snapNum), 'r') as f:
header = dict(f['Header'].attrs.items())
return header
def load(basePath, snapNum):
""" Load complete group catalog all at once. """
r = {}
r['subhalos'] = loadSubhalos(basePath, snapNum)
r['halos'] = loadHalos(basePath, snapNum)
r['header'] = loadHeader(basePath, snapNum)
return r
def loadSingle(basePath, snapNum, haloID=-1, subhaloID=-1):
""" Return complete group catalog information for one halo or subhalo. """
if (haloID < 0 and subhaloID < 0) or (haloID >= 0 and subhaloID >= 0):
raise Exception("Must specify either haloID or subhaloID (and not both).")
gName = "Subhalo" if subhaloID >= 0 else "Group"
searchID = subhaloID if subhaloID >= 0 else haloID
# old or new format
if 'fof_subhalo' in gcPath(basePath, snapNum):
# use separate 'offsets_nnn.hdf5' files
with h5py.File(offsetPath(basePath, snapNum), 'r') as f:
offsets = f['FileOffsets/'+gName][()]
else:
# use header of group catalog
with h5py.File(gcPath(basePath, snapNum), 'r') as f:
offsets = f['Header'].attrs['FileOffsets_'+gName]
offsets = searchID - offsets
fileNum = np.max(np.where(offsets >= 0))
groupOffset = offsets[fileNum]
# load halo/subhalo fields into a dict
result = {}
with h5py.File(gcPath(basePath, snapNum, fileNum), 'r') as f:
for haloProp in f[gName].keys():
result[haloProp] = f[gName][haloProp][groupOffset]
return result