/** * Copyright (c) 2017 molio contributors, licensed under MIT, See LICENSE file for more info. * * @author David Sehnal <david.sehnal@gmail.com> */ import { RawData } from '../formats' import { Frame as mmCIF } from '../../../mol-io/reader/cif/schema/mmcif' import Model from '../../model' import Column from '../../../mol-base/collections/column' import Table from '../../../mol-base/collections/table' import Interval from '../../../mol-base/collections/integer/interval' import Segmentation from '../../../mol-base/collections/integer/segmentation' import { newUUID } from '../../../mol-base/utils/uuid' import * as Hierarchy from '../properties/hierarchy' import Conformation from '../properties/conformation' import findHierarchyKeys from '../utils/hierarchy-keys' function findModelBounds(data: mmCIF, startIndex: number) { const num = data.atom_site.pdbx_PDB_model_num; const atomCount = num.rowCount; if (!num.isDefined) return Interval.ofBounds(startIndex, atomCount); let endIndex = startIndex + 1; while (endIndex < atomCount && num.areValuesEqual(startIndex, endIndex)) endIndex++; return Interval.ofBounds(startIndex, endIndex); } function findHierarchyOffsets(data: mmCIF, bounds: Interval) { const start = Interval.start(bounds), end = Interval.end(bounds); const residues = [start], chains = [start]; const { label_entity_id, auth_asym_id, auth_seq_id, pdbx_PDB_ins_code, label_comp_id } = data.atom_site; for (let i = start + 1; i < end; i++) { const newChain = !label_entity_id.areValuesEqual(i - 1, i) || !auth_asym_id.areValuesEqual(i - 1, i); const newResidue = newChain || !auth_seq_id.areValuesEqual(i - 1, i) || !pdbx_PDB_ins_code.areValuesEqual(i - 1, i) || !label_comp_id.areValuesEqual(i - 1, i); if (newResidue) residues[residues.length] = i; if (newChain) chains[chains.length] = i; } return { residues, chains }; } function createHierarchyData(data: mmCIF, bounds: Interval, offsets: { residues: ArrayLike<number>, chains: ArrayLike<number> }): Hierarchy.Data { const { atom_site } = data; const start = Interval.start(bounds), end = Interval.end(bounds); const atoms = Table.ofColumns<Hierarchy.AtomsSchema>({ type_symbol: Column.ofArray({ array: Column.mapToArray(Column.window(atom_site.type_symbol, start, end), Hierarchy.ElementSymbol), type: Column.Type.aliased<Hierarchy.ElementSymbol>(Column.Type.str) }), label_atom_id: Column.window(atom_site.label_atom_id, start, end), auth_atom_id: Column.window(atom_site.auth_atom_id, start, end), label_alt_id: Column.window(atom_site.label_alt_id, start, end), pdbx_formal_charge: Column.window(atom_site.pdbx_formal_charge, start, end) }); const residues = Table.view(atom_site, Hierarchy.ResiduesSchema, offsets.residues); const chains = Table.view(atom_site, Hierarchy.ChainsSchema, offsets.chains); return { atoms, residues, chains, entities: data.entity }; } function getConformation(data: mmCIF, bounds: Interval): Conformation { const start = Interval.start(bounds), end = Interval.end(bounds); const { atom_site } = data; return { id: Column.window(atom_site.id, start, end), occupancy: Column.window(atom_site.occupancy, start, end), B_iso_or_equiv: Column.window(atom_site.B_iso_or_equiv, start, end), x: atom_site.Cartn_x.toArray({ array: Float32Array, start, end }), y: atom_site.Cartn_y.toArray({ array: Float32Array, start, end }), z: atom_site.Cartn_z.toArray({ array: Float32Array, start, end }), } } function isHierarchyDataEqual(a: Hierarchy.Hierarchy, b: Hierarchy.Data) { // need to cast because of how TS handles type resolution for interfaces https://github.com/Microsoft/TypeScript/issues/15300 return Table.areEqual(a.chains as Table<Hierarchy.ChainsSchema>, b.chains as Table<Hierarchy.ChainsSchema>) && Table.areEqual(a.residues as Table<Hierarchy.ResiduesSchema>, b.residues as Table<Hierarchy.ResiduesSchema>) && Table.areEqual(a.atoms as Table<Hierarchy.AtomsSchema>, b.atoms as Table<Hierarchy.AtomsSchema>) } function createModel(raw: RawData, data: mmCIF, bounds: Interval, previous?: Model): Model { const hierarchyOffsets = findHierarchyOffsets(data, bounds); const hierarchyData = createHierarchyData(data, bounds, hierarchyOffsets); if (previous && isHierarchyDataEqual(previous.hierarchy, hierarchyData)) { return { ...previous, conformation: getConformation(data, bounds), version: { hierarchy: previous.version.hierarchy, conformation: newUUID() } }; } const hierarchySegments: Hierarchy.Segments = { residueSegments: Segmentation.ofOffsets(hierarchyOffsets.residues, bounds), chainSegments: Segmentation.ofOffsets(hierarchyOffsets.chains, bounds), } const hierarchyKeys = findHierarchyKeys(hierarchyData, hierarchySegments); return { id: newUUID(), sourceData: raw, model_num: data.atom_site.pdbx_PDB_model_num.value(Interval.start(bounds)), hierarchy: { ...hierarchyData, ...hierarchyKeys, ...hierarchySegments }, conformation: getConformation(data, bounds), version: { hierarchy: newUUID(), conformation: newUUID() }, atomCount: Interval.size(bounds) }; } function buildModels(data: mmCIF): ArrayLike<Model> { const raw: RawData = { source: 'mmCIF', data }; const models: Model[] = []; const atomCount = data.atom_site._rowCount; if (atomCount === 0) return models; let modelStart = 0; while (modelStart < atomCount) { const bounds = findModelBounds(data, modelStart); const model = createModel(raw, data, bounds, models.length > 0 ? models[models.length - 1] : void 0); models.push(model); modelStart = Interval.end(bounds); } return models; } export default buildModels;