/** * Copyright (c) 2017 mol* contributors, licensed under MIT, See LICENSE file for more info. * * @author David Sehnal <david.sehnal@gmail.com> */ import * as B from 'benchmark' import * as util from 'util' import * as fs from 'fs' import fetch from 'node-fetch' import CIF from 'mol-io/reader/cif' import { Structure, Model, Queries as Q, Element, ElementGroup, ElementSet, Selection, Symmetry, Unit } from 'mol-model/structure' import { Segmentation, OrderedSet } from 'mol-data/int' import to_mmCIF from 'mol-model/structure/export/mmcif' import { Run } from 'mol-task'; import { EquivalenceClasses } from 'mol-data/util'; require('util.promisify').shim(); const readFileAsync = util.promisify(fs.readFile); const writeFileAsync = util.promisify(fs.writeFile); async function readData(path: string) { if (path.match(/\.bcif$/)) { const input = await readFileAsync(path) const data = new Uint8Array(input.byteLength); for (let i = 0; i < input.byteLength; i++) data[i] = input[i]; return data; } else { return readFileAsync(path, 'utf8'); } } (Symbol as any).asyncIterator = (Symbol as any).asyncIterator || Symbol.for('Symbol.asyncIterator'); interface ProgressGenerator<T> extends AsyncIterableIterator<number | T> { next(cont?: boolean): Promise<IteratorResult<number | T>> } async function *test(): ProgressGenerator<boolean> { const r = yield await new Promise<number>(res => res(10)); return r; } async function runIt(itP: () => ProgressGenerator<boolean>) { const it = itP(); while (true) { const { value, done } = await it.next(true); if (done) return value; } } runIt(test).then(r => console.log('rerdasdasda', r)) export async function readCIF(path: string) { console.time('readData'); const input = await readData(path) console.timeEnd('readData'); console.time('parse'); const comp = typeof input === 'string' ? CIF.parseText(input) : CIF.parseBinary(input); const parsed = await Run(comp); console.timeEnd('parse'); if (parsed.isError) { throw parsed; } const data = parsed.result.blocks[0]; console.time('schema') const mmcif = CIF.schema.mmCIF(data); console.timeEnd('schema') console.time('buildModels') const models = Model.create({ kind: 'mmCIF', data: mmcif }); console.timeEnd('buildModels') const structures = models.map(Structure.ofModel); return { mmcif, models, structures }; } const DATA_DIR = './build/data'; if (!fs.existsSync(DATA_DIR)) fs.mkdirSync(DATA_DIR); function getBcifUrl(pdbId: string) { return `http://www.ebi.ac.uk/pdbe/coordinates/${pdbId.toLowerCase()}/full?encoding=bcif` } function getBcifPath(pdbId: string) { return `${DATA_DIR}/${pdbId.toLowerCase()}_full.bcif` } async function ensureBcifAvailable(pdbId: string) { const bcifPath = getBcifPath(pdbId); if (!fs.existsSync(bcifPath)) { console.log(`downloading ${pdbId} bcif...`) const data = await fetch(getBcifUrl(pdbId)) await writeFileAsync(bcifPath, await data.buffer()) console.log(`done downloading ${pdbId} bcif`) } } export async function getBcif(pdbId: string) { await ensureBcifAvailable(pdbId); return await readCIF(getBcifPath(pdbId)); } export namespace PropertyAccess { function baseline(model: Model) { if (model.sourceData.kind !== 'mmCIF') throw new Error('Model must be mmCIF'); const atom_site = model.sourceData.data.atom_site; const id = atom_site.id.value; let s = 0; for (let i = 0, _i = atom_site._rowCount; i < _i; i++) { s += id(i); } return s; } function sumProperty(structure: Structure, p: Element.Property<number>) { const { elements, units } = structure; const unitIds = ElementSet.unitIds(elements); const l = Element.Location(); let s = 0; for (let i = 0, _i = unitIds.length; i < _i; i++) { l.unit = units[unitIds[i]]; const set = ElementSet.unitGetByIndex(elements, i); for (let j = 0, _j = ElementGroup.size(set); j < _j; j++) { l.element= ElementGroup.getAt(set, j); s += p(l); } } return s; } function sumPropertySegmented(structure: Structure, p: Element.Property<number>) { const { elements, units } = structure; const unitIds = ElementSet.unitIds(elements); const l = Element.Location(); let s = 0; let vA = 0, cC = 0, rC = 0; for (let i = 0, _i = unitIds.length; i < _i; i++) { const unit = units[unitIds[i]]; l.unit = unit; const set = ElementSet.unitGetByIndex(elements, i); const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set.elements); const residues = unit.hierarchy.residueSegments; while (chainsIt.hasNext) { cC++; const chainSegment = chainsIt.move(); const residuesIt = Segmentation.transientSegments(residues, set.elements, chainSegment); while (residuesIt.hasNext) { rC++; const residueSegment = residuesIt.move(); // l.element= OrdSet.getAt(set, residueSegment.start); // console.log(unit.hierarchy.residues.auth_comp_id.value(unit.residueIndex[l.atom]), l.atom, OrdSet.getAt(set, residueSegment.end)) for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) { l.element= ElementGroup.getAt(set, j); vA++; s += p(l); } } } } console.log('seg atom count', vA, cC, rC); return s; } // function sumPropertyResidue(structure: Structure, p: Element.Property<number>) { // const { atoms, units } = structure; // const unitIds = ElementSet.unitIds(atoms); // const l = Element.Location(); // let s = 0; // for (let i = 0, _i = unitIds.length; i < _i; i++) { // const unit = units[unitIds[i]]; // l.unit = unit; // const set = ElementSet.unitGetByIndex(atoms, i); // const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set.atoms); // while (residuesIt.hasNext) { // l.element= ElementGroup.getAt(set, residuesIt.move().start); // s += p(l); // } // } // return s; // } function sumPropertyAtomSetIt(structure: Structure, p: Element.Property<number>) { const { elements, units } = structure; let s = 0; const atomsIt = ElementSet.elements(elements); const l = Element.Location(); while (atomsIt.hasNext) { const a = atomsIt.move(); l.unit = units[Element.unit(a)]; l.element= Element.index(a); s += p(l); } return s; } // function sumPropertySegmentedMutable(structure: Structure, p: Property<number>) { // const { atoms, units } = structure; // const unitIds = ElementSet.unitIds(atoms); // const l = Property.createLocation(); // let s = 0; // for (let i = 0, _i = unitIds.length; i < _i; i++) { // const unit = units[unitIds[i]]; // l.unit = unit; // const set = ElementSet.unitGetByIndex(atoms, i); // const chainsIt = Segmentation.transientSegments(unit.hierarchy.chainSegments, set); // const residuesIt = Segmentation.transientSegments(unit.hierarchy.residueSegments, set); // while (chainsIt.hasNext) { // const chainSegment = chainsIt.move(); // residuesIt.updateRange(chainSegment); // while (residuesIt.hasNext) { // const residueSegment = residuesIt.move(); // for (let j = residueSegment.start, _j = residueSegment.end; j < _j; j++) { // l.element= OrdSet.getAt(set, j); // s += p(l); // } // } // } // } // return s; // } // function sumDirect(structure: Structure) { // const { atoms, units } = structure; // const unitIds = ElementSet.unitIds(atoms); // let s = 0; // for (let i = 0, _i = unitIds.length; i < _i; i++) { // const unitId = unitIds[i]; // const unit = units[unitId]; // const set = ElementSet.unitGetByIndex(atoms, i); // //const { residueIndex, chainIndex } = unit; // const p = unit.conformation.atomId.value; // for (let j = 0, _j = ElementGroup.size(set); j < _j; j++) { // const aI = ElementGroup.getAt(set, j); // s += p(aI); // } // } // return s; // } // function concatProperty(structure: Structure, p: Property<string>) { // const { atoms, units } = structure; // const unitIds = ElementSet.unitIds(atoms); // const l = Property.createLocation(structure); // let s = []; // for (let i = 0, _i = unitIds.length; i < _i; i++) { // const unitId = unitIds[i]; // l.unit = units[unitId]; // const set = ElementSet.unitGetByIndex(atoms, i); // const { residueIndex, chainIndex } = l.unit; // for (let j = 0, _j = OrdSet.size(set); j < _j; j++) { // const aI = OrdSet.getAt(set, j); // l.element= aI; // l.residueIndex = residueIndex[aI]; // l.chainIndex = chainIndex[aI]; // s[s.length] = p(l); // } // } // return s; // } export function write(s: Structure) { console.log(to_mmCIF('test', s)); } export function testAssembly(id: string, s: Structure) { console.time('assembly') const a = Symmetry.buildAssembly(s, '1'); console.timeEnd('assembly') fs.writeFileSync(`${DATA_DIR}/${id}_assembly.bcif`, to_mmCIF(id, a, true)); console.log('exported'); } export function testGrouping(structure: Structure) { const { elements, units } = Symmetry.buildAssembly(structure, '1'); console.log('grouping', units.length); console.log('built asm'); const uniqueGroups = EquivalenceClasses<number, { unit: Unit, group: ElementGroup }>( ({ unit, group }) => ElementGroup.hashCode(group), (a, b) => a.unit.model.id === b.unit.model.id && (a.group.key === b.group.key && OrderedSet.areEqual(a.group.elements, b.group.elements)) ); for (let i = 0, _i = ElementSet.unitCount(elements); i < _i; i++) { const group = ElementSet.unitGetByIndex(elements, i); const unitId = ElementSet.unitGetId(elements, i); uniqueGroups.add(unitId, { unit: units[unitId], group }); } console.log('group count', uniqueGroups.groups.length); } export async function run() { //const { structures, models/*, mmcif*/ } = await getBcif('1cbs'); // const { structures, models } = await getBcif('3j3q'); const { structures, models /*, mmcif*/ } = await readCIF('e:/test/quick/1hrv_updated.cif'); const { structures: s1, /*, mmcif*/ } = await readCIF('e:/test/quick/1tqn_updated.cif'); testGrouping(structures[0]); console.log('------'); testGrouping(s1[0]); //const { structures, models/*, mmcif*/ } = await readCIF('e:/test/quick/5j7v_updated.cif'); //console.log(mmcif.pdbx_struct_oper_list.matrix.toArray()); // console.log(mmcif.pdbx_struct_oper_list.vector.toArray()); // testAssembly('5j7v', structures[0]); // throw ''; // console.log(models[0].symmetry.assemblies); //const { structures, models } = await readCIF('e:/test/molstar/3j3q.bcif'); // fs.writeFileSync('e:/test/molstar/3j3q.bcif', to_mmCIF('test', structures[0], true)); // return; // console.log(toMmCIFString('test', structures[0])); // return; console.log('bs', baseline(models[0])); console.log('sp', sumProperty(structures[0], l => l.unit.model.conformation.atomId.value(l.element))); console.log(sumPropertySegmented(structures[0], l => l.unit.model.conformation.atomId.value(l.element))); //console.log(sumPropertySegmentedMutable(structures[0], l => l.unit.model.conformation.atomId.value(l.element)); console.log(sumPropertyAtomSetIt(structures[0], l => l.unit.model.conformation.atomId.value(l.element))); //console.log(sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId))); //console.log(sumDirect(structures[0])); //console.log('r', sumPropertyResidue(structures[0], l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom]))); console.time('atom.x'); console.log('atom.x', sumProperty(structures[0], Q.props.atom.x)); console.timeEnd('atom.x'); console.time('__x') //console.log('__x', sumProperty(structures[0], l => l.unit.conformation.x[l.atom])); console.timeEnd('__x') //const authSeqId = Element.property(l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom])); //const auth_seq_id = Q.props.residue.auth_seq_id; const auth_comp_id = Q.props.residue.auth_comp_id; //const auth_asym_id = Q.props.chain.auth_asym_id; //const set = new Set(['A', 'B', 'C', 'D']); //const q = Q.generators.atomGroups({ atomTest: l => auth_seq_id(l) < 3 }); const q = Q.generators.atoms({ atomTest: Q.pred.eq(Q.props.residue.auth_comp_id, 'ALA') }); const P = Q.props //const q0 = Q.generators.atoms({ atomTest: l => auth_comp_id(l) === 'ALA' }); const q1 = Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA' }); const q2 = Q.generators.atoms({ residueTest: l => auth_comp_id(l) === 'ALA', groupBy: Q.props.residue.key }); const q3 = Q.generators.atoms({ chainTest: Q.pred.inSet(P.chain.auth_asym_id, ['A', 'B', 'C', 'D']), residueTest: Q.pred.eq(P.residue.auth_comp_id, 'ALA') }); q(structures[0]); //console.log(to_mmCIF('test', Selection.union(q0r))); console.time('q1') q1(structures[0]); console.timeEnd('q1') console.time('q1') q1(structures[0]); console.timeEnd('q1') console.time('q2') const q2r = q2(structures[0]); console.timeEnd('q2') console.log(Selection.structureCount(q2r)); //console.log(q1(structures[0])); //const col = models[0].conformation.atomId.value; const suite = new B.Suite(); suite //.add('test q', () => q1(structures[0])) //.add('test q', () => q(structures[0])) .add('test q1', () => q1(structures[0])) .add('test q3', () => q3(structures[0])) //.add('test int', () => sumProperty(structures[0], l => col(l.element)) // .add('sum residue', () => sumPropertyResidue(structures[0], l => l.unit.hierarchy.residues.auth_seq_id.value(l.unit.residueIndex[l.atom]))) // .add('baseline', () => baseline(models[0])) // .add('direct', () => sumDirect(structures[0])) //.add('normal int', () => sumProperty(structures[0], l => l.unit.model.conformation.atomId.value(l.element)) //.add('atom set it int', () => sumPropertyAtomSetIt(structures[0], l => l.unit.conformation.atomId.value(l.element)) // .add('segmented faster int', () => sumPropertySegmented(structures[0], l => l.unit.conformation.atomId.value(l.element)) // .add('faster int', () => sumProperty(structures[0], l => l.unit.conformation.atomId.value(l.element)) //.add('segmented faster _x', () => sumPropertySegmented(structures[0], l => l.unit.conformation.__x[l.atom])) //.add('faster _x', () => sumProperty(structures[0], l => l.unit.conformation.__x[l.atom] + l.unit.conformation.__y[l.atom] + l.unit.conformation.__z[l.atom])) //.add('segmented mut faster int', () => sumPropertySegmentedMutable(structures[0], l => l.unit.conformation.atomId.value(l.element)) //.add('normal shortcut int', () => sumProperty(structures[0], l => l.conformation.atomId.value(l.element)) //.add('cached int', () => sumProperty(structures[0], Property.cachedAtomColumn(m => m.conformation.atomId))) //.add('concat str', () => concatProperty(structures[0], l => l.unit.model.hierarchy.atoms.auth_atom_id.value(l.element)) //.add('cached concat str', () => concatProperty(structures[0], Property.cachedAtomColumn(m => m.hierarchy.atoms.auth_atom_id))) .on('cycle', (e: any) => console.log(String(e.target))) .run(); } } PropertyAccess.run();