// structure.ts (14 KB)
  /**
   * Copyright (c) 2017 mol* contributors, licensed under MIT, See LICENSE file for more info.
   *
   * @author David Sehnal <david.sehnal@gmail.com>
   */
  6. import * as B from 'benchmark'
  7. import * as util from 'util'
  8. import * as fs from 'fs'
  9. import CIF from 'mol-io/reader/cif'
  10. import { Structure, Model, Queries as Q, Atom, AtomGroup, AtomSet, Selection, Symmetry } from 'mol-model/structure'
  11. import { Segmentation } from 'mol-data/int'
  12. import to_mmCIF from 'mol-model/structure/export/mmcif'
  // Install the `util.promisify` shim first (presumably a polyfill for Node
  // versions without a native implementation); the call below relies on
  // `util.promisify` being available.
  const promisifyPolyfill = require('util.promisify');
  promisifyPolyfill.shim();

  /** Promise-returning wrapper around `fs.readFile`. */
  const readFileAsync = util.promisify(fs.readFile);
  /**
   * Reads a file either as raw bytes or as UTF-8 text, depending on its extension.
   *
   * @param path file to read; a name ending in `.bcif` is read as binary,
   *             anything else is read as UTF-8 text
   * @returns a `Uint8Array` holding a copy of the file's bytes for `.bcif`
   *          paths, otherwise the file's text
   */
  async function readData(path: string) {
      if (/\.bcif$/.test(path)) {
          const input = await readFileAsync(path);
          // Constructing a typed array from another typed array copies the
          // elements in one step and yields a plain Uint8Array (not a Buffer),
          // which is exactly what the former byte-by-byte loop produced.
          return new Uint8Array(input);
      }
      return readFileAsync(path, 'utf8');
  }
  /**
   * Minimal generator used to exercise `runIt`: yields a single value (10)
   * and then finishes with a return value (15).
   */
  function* test() {
      const yielded = 10;
      const finalValue = 15;
      yield yielded;
      return finalValue;
  }
  /**
   * Drives an iterator to completion and resolves with its final value.
   *
   * The iterator is stepped in a plain loop with no `await` in between, so
   * all steps execute synchronously during the call; only the result is
   * delivered through the returned promise. Intermediate yielded values are
   * discarded.
   *
   * @param itP factory that creates the iterator to run
   * @returns promise resolving to the `value` of the first result whose
   *          `done` flag is set (for a generator, its return value)
   */
  async function runIt<T>(itP: () => IterableIterator<T>) {
      const it = itP();
      while (true) {
          const { value, done } = it.next();
          if (done) return value;
      }
  }
  // Run the sample generator through `runIt` at module load and print its
  // final value; the resulting promise is deliberately not awaited.
  void runIt(test).then(result => {
      console.log('rerdasdasda', result);
  });
  /**
   * Loads a CIF file and builds models and structures from its first data block.
   *
   * Each stage (reading, parsing, schema application, model building) is
   * timed with `console.time` / `console.timeEnd`.
   *
   * @param path file to load; passed on to `readData`
   * @returns the mmCIF view of the first data block, the models created from
   *          it, and one structure per model
   * @throws the parse result itself when it is flagged with `isError`
   */
  export async function readCIF(path: string) {
      console.time('readData');
      const raw = await readData(path);
      console.timeEnd('readData');

      console.time('parse');
      // String input goes to the text parser, everything else to the binary one.
      const parseTask = typeof raw === 'string'
          ? CIF.parseText(raw)
          : CIF.parseBinary(raw);
      const parseResult = await parseTask();
      console.timeEnd('parse');

      if (parseResult.isError) throw parseResult;

      // Only the first data block of the file is used.
      const firstBlock = parseResult.result.blocks[0];

      console.time('schema');
      const mmcif = CIF.schema.mmCIF(firstBlock);
      console.timeEnd('schema');

      console.time('buildModels');
      const models = Model.create({ kind: 'mmCIF', data: mmcif });
      console.timeEnd('buildModels');

      const structures = models.map(Structure.ofModel);
      return { mmcif, models, structures };
  }
  /**
   * Ad-hoc benchmarks comparing different ways of reading per-atom properties
   * from a structure, together with a few query and export experiments.
   */
  export namespace PropertyAccess {
      /** Input file `run` loads when the caller does not supply one. */
      const DEFAULT_INPUT_PATH = 'e:/test/quick/3j3q_full.bcif';
      /** Directory `testAssembly` writes into when the caller does not supply one. */
      const DEFAULT_EXPORT_DIR = 'e:/test/molstar';

      /**
       * Sums `atom_site.id` over all rows, reading straight from the model's
       * source data. Serves as the reference point for the other variants.
       */
      function baseline(model: Model) {
          const atom_site = model.sourceData.data.atom_site;
          const id = atom_site.id.value;
          let s = 0;
          for (let i = 0, _i = atom_site._rowCount; i < _i; i++) {
              s += id(i);
          }
          return s;
      }

      /**
       * Sums property `p` over every atom of the structure, walking the atom
       * set unit by unit and reusing a single `Atom.Location`.
       */
      function sumProperty(structure: Structure, p: Atom.Property<number>) {
          const { atoms, units } = structure;
          const unitIds = AtomSet.unitIds(atoms);
          const l = Atom.Location();

          let s = 0;
          for (let i = 0, _i = unitIds.length; i < _i; i++) {
              l.unit = units[unitIds[i]];
              const set = AtomSet.unitGetByIndex(atoms, i);

              for (let j = 0, _j = AtomGroup.size(set); j < _j; j++) {
                  l.atom = AtomGroup.getAt(set, j);
                  s += p(l);
              }
          }
          return s;
      }

      /**
       * Sums property `p` over every atom, but reaches the atoms through the
       * chain segments and, inside each chain, the residue segments.
       *
       * Also counts visited atoms, chains and residues and logs the three
       * counters before returning.
       */
      function sumPropertySegmented(structure: Structure, p: Atom.Property<number>) {
          const { atoms, units } = structure;
          const unitIds = AtomSet.unitIds(atoms);
          const l = Atom.Location();

          let s = 0;
          // visited atoms / chains / residues
          let vA = 0, cC = 0, rC = 0;
          for (let i = 0, _i = unitIds.length; i < _i; i++) {
              const unit = units[unitIds[i]];
              l.unit = unit;
              const set = AtomSet.unitGetByIndex(atoms, i);

              const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set.atoms);
              const residues = unit.hierarchy.residueSegments;
              while (chainsIt.hasNext) {
                  cC++;

                  const chainSegment = chainsIt.move();
                  // Residue iteration is restricted to the current chain segment.
                  const residuesIt = Segmentation.transientSegments(residues, set.atoms, chainSegment);
                  while (residuesIt.hasNext) {
                      rC++;
                      const residueSegment = residuesIt.move();
                      // l.atom = OrdSet.getAt(set, residueSegment.start);
                      // console.log(unit.hierarchy.residues.auth_comp_id.value(unit.residueIndex[l.atom]), l.atom, OrdSet.getAt(set, residueSegment.end))
                      for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) {
                          l.atom = AtomGroup.getAt(set, j);
                          vA++;
                          s += p(l);
                      }
                  }
              }
          }

          console.log('seg atom count', vA, cC, rC);

          return s;
      }

      /**
       * Sums property `p` once per residue segment, evaluated at the atom found
       * at the segment's `start` position.
       */
      function sumPropertyResidue(structure: Structure, p: Atom.Property<number>) {
          const { atoms, units } = structure;
          const unitIds = AtomSet.unitIds(atoms);
          const l = Atom.Location();

          let s = 0;
          for (let i = 0, _i = unitIds.length; i < _i; i++) {
              const unit = units[unitIds[i]];
              l.unit = unit;
              const set = AtomSet.unitGetByIndex(atoms, i);
              const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set.atoms);
              while (residuesIt.hasNext) {
                  l.atom = AtomGroup.getAt(set, residuesIt.move().start);
                  s += p(l);
              }
          }
          return s;
      }

      /**
       * Sums property `p` over every atom using the `AtomSet.atoms` iterator,
       * splitting each yielded atom into its unit and index parts.
       */
      function sumPropertyAtomSetIt(structure: Structure, p: Atom.Property<number>) {
          const { atoms, units } = structure;

          let s = 0;
          const atomsIt = AtomSet.atoms(atoms);
          const l = Atom.Location();
          while (atomsIt.hasNext) {
              const a = atomsIt.move();
              l.unit = units[Atom.unit(a)];
              l.atom = Atom.index(a);
              s += p(l);
          }
          return s;
      }

      // Disabled variant, kept for reference:
      // function sumPropertySegmentedMutable(structure: Structure, p: Property<number>) {
      //     const { atoms, units } = structure;
      //     const unitIds = AtomSet.unitIds(atoms);
      //     const l = Property.createLocation();

      //     let s = 0;
      //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
      //         const unit = units[unitIds[i]];
      //         l.unit = unit;
      //         const set = AtomSet.unitGetByIndex(atoms, i);

      //         const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set);
      //         const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set);
      //         while (chainsIt.hasNext) {
      //             const chainSegment = chainsIt.move();
      //             residuesIt.updateRange(chainSegment);
      //             while (residuesIt.hasNext) {
      //                 const residueSegment = residuesIt.move();
      //                 for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) {
      //                     l.atom = OrdSet.getAt(set, j);
      //                     s += p(l);
      //                 }
      //             }
      //         }
      //     }

      //     return s;
      // }

      /**
       * Sums `unit.conformation.atomId` over every atom by calling the column
       * accessor directly, without going through an `Atom.Location`.
       */
      function sumDirect(structure: Structure) {
          const { atoms, units } = structure;
          const unitIds = AtomSet.unitIds(atoms);

          let s = 0;
          for (let i = 0, _i = unitIds.length; i < _i; i++) {
              const unitId = unitIds[i];
              const unit = units[unitId];
              const set = AtomSet.unitGetByIndex(atoms, i);
              //const { residueIndex, chainIndex } = unit;
              const p = unit.conformation.atomId.value;
              for (let j = 0, _j = AtomGroup.size(set); j < _j; j++) {
                  const aI = AtomGroup.getAt(set, j);
                  s += p(aI);
              }
          }
          return s;
      }

      // Disabled variant, kept for reference:
      // function concatProperty(structure: Structure, p: Property<string>) {
      //     const { atoms, units } = structure;
      //     const unitIds = AtomSet.unitIds(atoms);
      //     const l = Property.createLocation(structure);

      //     let s = [];
      //     for (let i = 0, _i = unitIds.length; i < _i; i++) {
      //         const unitId = unitIds[i];
      //         l.unit = units[unitId];
      //         const set = AtomSet.unitGetByIndex(atoms, i);
      //         const { residueIndex, chainIndex } = l.unit;

      //         for (let j = 0, _j = OrdSet.size(set); j < _j; j++) {
      //             const aI = OrdSet.getAt(set, j);
      //             l.atom = aI;
      //             l.residueIndex = residueIndex[aI];
      //             l.chainIndex = chainIndex[aI];
      //             s[s.length] = p(l);
      //         }
      //     }
      //     return s;
      // }

      /** Prints the mmCIF export of `s` (under the name `'test'`) to the console. */
      export function write(s: Structure) {
          console.log(to_mmCIF('test', s));
      }

      /**
       * Builds assembly `'1'` of a structure, reports how long that took and
       * writes the exported result to `<outDir>/<id>_assembly.bcif`.
       *
       * @param id     name passed to the exporter and used as the file name prefix
       * @param s      structure to build the assembly from
       * @param outDir directory to write into; defaults to the location that
       *               used to be hard-coded
       */
      export function testAssembly(id: string, s: Structure, outDir: string = DEFAULT_EXPORT_DIR) {
          console.time('assembly');
          const a = Symmetry.buildAssembly(s, '1');
          console.timeEnd('assembly');
          // NOTE(review): the third argument presumably selects binary output,
          // matching the `.bcif` extension; confirm against the exporter.
          fs.writeFileSync(`${outDir}/${id}_assembly.bcif`, to_mmCIF(id, a, true));
          console.log('exported');
          //write(a);
      }

      /**
       * Loads a structure file and runs the property-access comparisons, a few
       * timed queries and finally a Benchmark.js suite, logging all results.
       *
       * @param path file to load; defaults to the input that used to be hard-coded
       * @throws Error when the file yields no models (and hence no structures)
       */
      export async function run(path: string = DEFAULT_INPUT_PATH) {
          //const { structures, models, mmcif } = await readCIF('./examples/1cbs_full.bcif');
          const { structures, models } = await readCIF(path);
          //const { structures, models, mmcif } = await readCIF('e:/test/quick/1cbs_updated.cif');
          //const { structures, models/*, mmcif*/ } = await readCIF('e:/test/quick/5j7v_updated.cif');

          // Everything below works on the first model/structure; fail clearly
          // instead of dereferencing `undefined` further down.
          if (structures.length === 0) {
              throw new Error(`No models could be built from '${path}'`);
          }
          const structure = structures[0];
          const model = models[0];

          //console.log(mmcif.pdbx_struct_oper_list.matrix.toArray());
          // console.log(mmcif.pdbx_struct_oper_list.vector.toArray());

          // testAssembly('5j7v', structures[0]);
          // throw '';

          // console.log(models[0].symmetry.assemblies);

          //const { structures, models } = await readCIF('e:/test/molstar/3j3q.bcif');

          // fs.writeFileSync('e:/test/molstar/3j3q.bcif', to_mmCIF('test', structures[0], true));
          // return;

          // console.log(toMmCIFString('test', structures[0]));

          // return;

          // The same sum computed through each access strategy.
          console.log('bs', baseline(model));
          console.log('sp', sumProperty(structure, l => l.unit.model.conformation.atomId.value(l.atom)));
          console.log(sumPropertySegmented(structure, l => l.unit.model.conformation.atomId.value(l.atom)));

          //console.log(sumPropertySegmentedMutable(structures[0], l => l.unit.model.conformation.atomId.value(l.atom)));
          console.log(sumPropertyAtomSetIt(structure, l => l.unit.model.conformation.atomId.value(l.atom)));
          //console.log(sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId)));
          console.log(sumDirect(structure));
          console.log('r', sumPropertyResidue(structure, l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom])));

          // Query property vs. direct array access for the x coordinate.
          console.time('atom.x');
          console.log('atom.x', sumProperty(structure, Q.props.atom.x));
          console.timeEnd('atom.x');
          console.time('__x');
          console.log('__x', sumProperty(structure, l => l.unit.conformation.x[l.atom]));
          console.timeEnd('__x');

          //const authSeqId = Atom.property(l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom]));

          //const auth_seq_id = Q.props.residue.auth_seq_id;
          const auth_comp_id = Q.props.residue.auth_comp_id;
          //const auth_asym_id = Q.props.chain.auth_asym_id;
          //const set = new Set(['A', 'B', 'C', 'D']);
          //const q = Q.generators.atomGroups({ atomTest: l => auth_seq_id(l) < 3 });
          const q = Q.generators.atoms({ atomTest: Q.pred.eq(Q.props.residue.auth_comp_id, 'ALA') });
          const P = Q.props;
          //const q0 = Q.generators.atoms({ atomTest: l => auth_comp_id(l) === 'ALA' });
          const q1 = Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA' });
          const q2 = Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA', groupBy: Q.props.residue.key });
          const q3 = Q.generators.atoms({
              chainTest: Q.pred.inSet(P.chain.auth_asym_id, ['A', 'B', 'C', 'D']),
              residueTest: Q.pred.eq(P.residue.auth_comp_id, 'ALA')
          });
          q(structure);
          //console.log(to_mmCIF('test', Selection.union(q0r)));

          // q1 is timed twice in a row under the same label.
          console.time('q1');
          q1(structure);
          console.timeEnd('q1');
          console.time('q1');
          q1(structure);
          console.timeEnd('q1');
          console.time('q2');
          const q2r = q2(structure);
          console.timeEnd('q2');
          console.log(Selection.structureCount(q2r));
          //console.log(q1(structures[0]));

          //const col = models[0].conformation.atomId.value;
          const suite = new B.Suite();
          suite
              //.add('test q', () => q1(structures[0]))
              //.add('test q', () => q(structures[0]))
              .add('test q1', () => q1(structure))
              .add('test q3', () => q3(structure))
              //.add('test int', () => sumProperty(structures[0], l => col(l.atom)))
              // .add('sum residue', () => sumPropertyResidue(structures[0], l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom])))

              // .add('baseline', () => baseline(models[0]))
              // .add('direct', () => sumDirect(structures[0]))
              //.add('normal int', () => sumProperty(structures[0], l => l.unit.model.conformation.atomId.value(l.atom)))
              //.add('atom set it int', () => sumPropertyAtomSetIt(structures[0], l => l.unit.conformation.atomId.value(l.atom)))
              // .add('segmented faster int', () => sumPropertySegmented(structures[0], l => l.unit.conformation.atomId.value(l.atom)))
              // .add('faster int', () => sumProperty(structures[0], l => l.unit.conformation.atomId.value(l.atom)))
              //.add('segmented faster _x', () => sumPropertySegmented(structures[0], l => l.unit.conformation.__x[l.atom]))
              //.add('faster _x', () => sumProperty(structures[0], l => l.unit.conformation.__x[l.atom] + l.unit.conformation.__y[l.atom] + l.unit.conformation.__z[l.atom]))
              //.add('segmented mut faster int', () => sumPropertySegmentedMutable(structures[0], l => l.unit.conformation.atomId.value(l.atom)))
              //.add('normal shortcut int', () => sumProperty(structures[0], l => l.conformation.atomId.value(l.atom)))
              //.add('cached int', () => sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId)))
              //.add('concat str', () => concatProperty(structures[0], l => l.unit.model.hierarchy.atoms.auth_atom_id.value(l.atom)))
              //.add('cached concat str', () => concatProperty(structures[0], Property.cachedAtomColumn(m => m.hierarchy.atoms.auth_atom_id)))
              // Print each benchmark's summary line as soon as it completes.
              .on('cycle', (e: any) => console.log(String(e.target)))
              .run();
      }
  }
  // Start the benchmarks as soon as the module is loaded; the promise
  // returned by `run` is deliberately not awaited.
  void PropertyAccess.run();