# laydi/system/dataset.py

from scipy import atleast_2d,asarray,ArrayType,shape,nonzero
from scipy import sort as array_sort
from itertools import izip

class Dataset:
    """The Dataset base class.

    A Dataset is an n-way array with defined string identifiers across
    all dimensions.  Each dimension has a name, and each position along a
    dimension has an identifier; the dataset keeps a mapping
    ``dim name -> {identifier: index}``.

    example of use:

    ---
    dim_name_rows = 'rows'
    names_rows = ('row_a','row_b')
    ids_1 = [dim_name_rows, names_rows]

    dim_name_cols = 'cols'
    names_cols = ('col_a','col_b','col_c','col_d')
    ids_2 = [dim_name_cols, names_cols]

    Array_X = rand(2,4)
    data = Dataset(Array_X,(ids_1,ids_2),name="Testing")

    dim_names = [dim for dim in data]

    column_identifiers = [id for id in data['cols'].keys()]
    column_index = [index for index in data['cols'].values()]

    'cols' in data -> True

    ---

    data = Dataset(rand(10,20)) (generates dims and ids (no links))
    """

    # Registry of every dimension name handed to any dataset.  It lives on
    # the class so that all instances (and subclasses) share it; generated
    # dimension names are made unique against this set.
    _all_dims = set()

    def __init__(self, array, identifiers=None, name='Unnamed dataset'):
        """Create a dataset from an array and optional identifiers.

        array       -- an ArrayType instance; promoted to at least two
                       dimensions.
        identifiers -- iterable of (dim_name, ids) pairs, one per axis.  If
                       None, dimension names and identifiers are generated.
        name        -- display name of the dataset.

        Raises ValueError if array is not an ArrayType or if a dimension
        name is repeated in identifiers.
        """
        self._dims = []  # existing dimensions in this dataset, in axis order
        self._map = {}   # internal mapping for dataset: dim -> {identifier: index}
        self._name = name
        if not isinstance(array, ArrayType):
            raise ValueError("Array input must be of ArrayType")

        array = atleast_2d(asarray(array))
        self.shape = array.shape
        # 'is None' rather than '!= None': identifiers may be array-like, and
        # an element-wise comparison has no single truth value.
        if identifiers is None:
            identifiers = self._create_identifiers(self.shape, self._all_dims)
        self._set_identifiers(identifiers, self._all_dims)
        self._array = array

    def __str__(self):
        return self._name + ":\n" + "Dim names: " + str(self._dims)

    def __iter__(self):
        """Returns an iterator over dimensions of dataset."""
        return iter(self._dims)

    def __contains__(self, dim):
        """Returns True if dim is a dimension name in dataset."""
        return dim in self._map

    def __len__(self):
        """Returns the number of dimensions in the dataset"""
        return len(self._map)

    def __getitem__(self, dim):
        """Return the identifier -> index mapping along the dimension dim."""
        return self._map[dim]

    def _create_identifiers(self, shape, all_dims):
        """Creates dimension names and identifier names, and returns
        identifiers.

        The first two axes are suggested as 'rows' and 'cols', any further
        axis as 'dim'; each suggestion is made unique against all_dims and
        then registered there.  Identifiers are named '<axis>_<position>'.
        """
        dim_names = ['rows', 'cols']
        ids = []
        for axis, n in enumerate(shape):
            if axis < len(dim_names):
                dim_suggestion = dim_names[axis]
            else:
                dim_suggestion = 'dim'
            dim_suggestion = self._suggest_dim_name(dim_suggestion, all_dims)
            generated = ["%d_%d" % (axis, pos) for pos in range(n)]
            ids.append((dim_suggestion, generated))
            # Register immediately so the next axis cannot get the same name.
            all_dims.add(dim_suggestion)
        return ids

    def _set_identifiers(self, identifiers, all_dims):
        """Creates internal mapping of identifiers structure.

        identifiers is an iterable of (dim_name, ids) pairs.  Raises
        ValueError if a dimension name occurs twice within this dataset.
        """
        for dim, ids in identifiers:
            if dim in self._dims:
                raise ValueError("Dimension names must be unique whitin dataset")
            self._dims.append(dim)
            all_dims.add(dim)

            pos_map = {}
            for pos, ident in enumerate(ids):
                pos_map[ident] = pos
            self._map[dim] = pos_map

    def _suggest_dim_name(self, dim_name, all_dims):
        """Suggests a unique name for dim and returns it"""
        c = 0
        new_name = dim_name
        while new_name in all_dims:
            new_name = dim_name + "_" + str(c)
            c += 1
        return new_name

    def asarray(self):
        """Returns the numeric array (data) of dataset"""
        return self._array

    def add_array(self, array):
        """Replaces the data of the dataset with array.

        A one-dim array is transformed to a two-dim array (row-vector)
        before its shape is compared with the shape of the dataset.

        Raises ValueError if the shapes differ.
        """
        # Promote first: comparing the raw shape would reject every 1-D
        # input, since the dataset shape is always at least 2-D.
        array = atleast_2d(asarray(array))
        if self.shape != array.shape:
            raise ValueError("Input array must be of similar dimensions as dataset")
        self._array = array

    def get_name(self):
        """Returns dataset name"""
        return self._name

    def get_all_dims(self):
        """Returns the shared set of all registered dimension names"""
        return self._all_dims

    def get_dim_name(self, axis=None):
        """Returns dim name for an axis, if no axis is provided it returns a list of dims"""
        if isinstance(axis, int):
            return self._dims[axis]
        return list(self._dims)

    def get_identifiers(self, dim, indices=None, sorted=True):
        """Returns identifiers along dim, sorted by position (index) is optional.

        You can optionally provide a list of indices to get only the
        identifiers of a given position.  An empty list or empty array of
        indices gives an empty list back.

        Identifiers are the unique names (strings) for a variable in a given dim.
        Index (Indices) are the Identifiers position in a matrix in a given dim.
        """
        pos_map = self._map[dim]
        ids = list(pos_map)
        # NOTE: the parameter 'sorted' shadows the builtin of the same name
        # inside this method, hence list.sort() below.
        if sorted:
            ids.sort(key=pos_map.get)

        # 'is not None' keeps array-valued indices from being compared
        # element-wise against None.
        if indices is not None:
            ids = [ids[index] for index in indices]

        return ids

    def get_indices(self, dim, idents=None):
        """Returns indices for identifiers along dimension.

        You can optionally provide a list of identifiers to retrieve a index subset.
        Raises KeyError if an identifier is not present along dim.

        Identifiers are the unique names (strings) for a variable in a given dim.
        Index (Indices) are the Identifiers position in a matrix in a given dim."""
        pos_map = self._map[dim]
        if idents is None:
            # Materialise the values so the sort always receives a sequence.
            index = array_sort(list(pos_map.values()))
        else:
            index = [pos_map[key] for key in idents]
        return asarray(index)

class CategoryDataset(Dataset):
    """The category dataset class.

    Represents class membership information as a binary matrix
    (0/1-matrix).

    To save memory and allow fast intersection look-ups, the binary
    matrix can also be represented as a dictionary (see as_dict_lists).

    Always has linked dimension in first dim:
    ex matrix:
             go_term1    go_term2  ...
    gene_1
    gene_2
    gene_3
    .
    .
    .
    """

    def __init__(self,array,identifiers=None,name='A'):
        """Set up the underlying Dataset; no dict-of-lists exists yet."""
        Dataset.__init__(self, array, identifiers=identifiers, name=name)
        self.has_dictlists = False

    def as_dict_lists(self):
        """Build, cache and return the dict view of the first dimension.

        Every identifier along the first dimension is mapped to
        list(nonzero(row)) of its row in the array.  The result is stored
        on the instance and has_dictlists is switched on.
        """
        first_dim = self.get_dim_name(0)
        lookup = dict(
            (ident, list(nonzero(self._array[row, :])))
            for ident, row in self._map[first_dim].items()
        )
        self._dictlists = lookup
        self.has_dictlists = True
        return lookup

class GraphDataset(Dataset):
    """The graph dataset class.

    A dataset class for representing graphs using an adjacency matrix
    (aka. restricted to square symmetric signed integers matrices)

    If the library NetworkX is installed, there is support for
    representing the graph as a NetworkX.Graph, or NetworkX.XGraph structure.
    """
    def __init__(self,array=None,identifiers=None,shape=None,all_dims=[],**kwds):
        """Create a graph dataset from an adjacency matrix.

        array       -- the adjacency matrix (an ArrayType instance).
        identifiers -- (dim_name, ids) pairs, see Dataset.
        shape, all_dims -- accepted for backward compatibility; unused
                       (all_dims is never mutated, so its list default is
                       harmless).
        name        -- optional keyword; dataset name, defaults to 'A'.

        Raises ValueError (from Dataset) if array is not an ArrayType.
        """
        # Honour an explicit name instead of silently dropping it in **kwds.
        Dataset.__init__(self, array=array, identifiers=identifiers,
                         name=kwds.get('name', 'A'))
        self.has_graph = False

    def asnetworkx(self,nx_type='graph'):
        """Returns the dataset as a NetworkX graph of the requested type.

        Vertices are labelled with the identifiers of the first dimension.
        See _graph_from_adj_matrix for the accepted values of nx_type.
        """
        dim = self.get_dim_name()[0]
        ids = self.get_identifiers(dim)
        adj_mat = self.asarray()
        # Forward nx_type: it used to be accepted here but never passed on.
        G = self._graph_from_adj_matrix(adj_mat, labels=ids, nx_type=nx_type)
        self.has_graph = True
        return G

    def _graph_from_adj_matrix(self,A,labels=None,nx_type='graph'):
        """Creates a networkx graph class from adjacency matrix and ordered labels.

        nx_type -- 'graph' for nx.Graph; 'x_graph' or 'xgraph' for nx.XGraph
                   (only usable with NetworkX releases that provide XGraph).
        labels  -- vertex labels in row order; None results in
                   string-numbered labels.

        Raises IOError if A is not square or nx_type is unknown.
        """
        import networkx as nx
        m, n = shape(A)  # adjacency matrix must be of type that evals to true/false for neighbours
        if m != n:
            raise IOError("Adjacency matrix must be square")
        if nx_type == 'graph':
            G = nx.Graph()
        elif nx_type in ('x_graph', 'xgraph'):
            # Both spellings are accepted: the documentation used 'xgraph'
            # while the code only recognised 'x_graph'.
            G = nx.XGraph()
        else:
            raise IOError("Unknown graph type: %s" % nx_type)

        if labels is None:  # if labels not provided mark vertices with numbers
            labels = [str(i) for i in range(m)]

        # One edge per truthy entry; head is the row's label, tail the column's.
        for nbrs, head in zip(A, labels):
            for i, nbr in enumerate(nbrs):
                if nbr:
                    G.add_edge(head, labels[i])
        return G

# Class-level registry of dimension names, shared by every Dataset (and
# subclass) instance.  Datasets add their dimension names to it, and it is
# consulted when a unique name is suggested for a generated dimension.
Dataset._all_dims=set()

class Selection:
    """Holds the identifiers currently selected along each dimension of a dataset."""

    def __init__(self):
        """Start out with an empty selection."""
        # presumably keyed by dimension name -- verify against callers
        self.current_selection = dict()
Added category dataset 2006-08-08 09:54:00 +02:00			`from scipy import atleast_2d,asarray,ArrayType,shape,nonzero`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`from scipy import sort as array_sort`
			`from itertools import izip`
First commit 2006-04-17 00:57:50 +02:00
			`class Dataset:`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`"""The Dataset base class.`

op 2006-04-17 11:08:40 +02:00			`A Dataset is an n-way array with defined string identifiers across`
			`all dimensions.`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00
			`example of use:`

			`---`
			`dim_name_rows = 'rows'`
			`names_rows = ('row_a','row_b')`
			`ids_1 = [dim_name_rows, names_rows]`

			`dim_name_cols = 'cols'`
			`names_cols = ('col_a','col_b','col_c','col_d')`
			`ids_2 = [dim_name_cols, names_cols]`

			`Array_X = rand(2,4)`
			`data = Dataset(Array_X,(ids_1,ids_2),name="Testing")`

			`dim_names = [dim for dim in data]`

			`column_identifiers = [id for id in data['cols'].keys()]`
			`column_index = [index for index in data['cols'].values()]`

			`'cols' in data -> True`

			`---`

			`data = Dataset(rand(10,20)) (generates dims and ids (no links))`
First commit 2006-04-17 00:57:50 +02:00			`"""`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`def __init__(self,array,identifiers=None,name='Unnamed dataset'):`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`self._dims = [] #existing dimensions in this dataset`
			`self._map = {} # internal mapping for dataset: identifier <--> index`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`self._name = name`
			`if isinstance(array,ArrayType):`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`array = atleast_2d(asarray(array))`
			`self.shape = array.shape`
			`if identifiers!=None:`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`self._set_identifiers(identifiers,self._all_dims)`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`else:`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`ids = self._create_identifiers(self.shape,self._all_dims)`
			`self._set_identifiers(ids,self._all_dims)`
mainly play in plots 2006-04-18 16:25:46 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`self._array = array`

			`else:`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`raise ValueError, "Array input must be of ArrayType"`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00
* system/fluents.py: Fixed a bug where the the application tried to load a toolbar from None * system/plots.py: Fixed MainView.insert_view that was a no-op when in large view. * system/dataset.py: Changed __str__ of dataset to also show names of dimensions. 2006-07-21 16:30:09 +02:00			`def __str__(self):`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`return self._name + ":\n" + "Dim names: " + self._dims.__str__()`
Now can get and set name in Dataset. Also added getter for dim_names. 2006-04-21 14:28:29 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`def __iter__(self):`
			`"""Returns an iterator over dimensions of dataset."""`
			`return self._dims.__iter__()`

			`def __contains__(self,dim):`
			`"""Returns True if dim is a dimension name in dataset."""`
			`# return self._dims.__contains__(dim)`
			`return self._map.__contains__(dim)`

			`def __len__(self):`
			`"""Returns the number of dimensions in the dataset"""`
			`return len(self._map)`

			`def __getitem__(self,dim):`
			`"""Return the identifers along the dimension dim."""`
			`return self._map[dim]`

			`def _create_identifiers(self,shape,all_dims):`
			`"""Creates dimension names and identifier names, and returns`
			`identifiers."""`
op 2006-04-17 11:08:40 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`dim_names = ['rows','cols']`
			`ids = []`
			`for axis,n in enumerate(shape):`
			`if axis<2:`
			`dim_suggestion = dim_names[axis]`
			`else:`
			`dim_suggestion = 'dim'`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`dim_suggestion = self._suggest_dim_name(dim_suggestion,all_dims)`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`identifier_creation = [str(axis) + "_" + i for i in map(str,range(n))]`
			`ids.append((dim_suggestion,identifier_creation))`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`all_dims.add(dim_suggestion)`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`return ids`

			`def _set_identifiers(self,identifiers,all_dims):`
			`"""Creates internal mapping of identifiers structure."""`
			`for dim,ids in identifiers:`
			`pos_map={}`
			`if dim not in self._dims:`
			`self._dims.append(dim)`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`all_dims.add(dim)`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`else:`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`raise ValueError, "Dimension names must be unique whitin dataset"`
mainly overhaul of observers, and removal of project singleton 2006-04-20 12:27:58 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`for pos,id in enumerate(ids):`
			`pos_map[id] = pos`
			`self._map[dim] = pos_map`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`def _suggest_dim_name(self,dim_name,all_dims):`
			`"""Suggests a unique name for dim and returns it"""`
			`c = 0`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`new_name = dim_name`
			`while new_name in all_dims:`
			`new_name = dim_name + "_" + str(c)`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`c+=1`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`return new_name`
category data and plot selection update\| 2006-04-19 12:37:44 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`def asarray(self):`
			`"""Returns the numeric array (data) of dataset"""`
* system/plots.py: Added NetworkPlot, which may or may not work correctly. * system/dataset.py: Removed a few lines of obsolete code. 2006-08-01 15:22:39 +02:00			`return self._array`
category data and plot selection update\| 2006-04-19 12:37:44 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`def add_array(self,array):`
			`"""Adds array as an ArrayType object.`
			`A one-dim array is transformed to a two-dim array (row-vector)`
category data and plot selection update\| 2006-04-19 12:37:44 +02:00			`"""`

removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`if self.shape!=array.shape:`
			`raise ValueError, "Input array must be of similar dimensions as dataset"`
			`self._array = atleast_2d(asarray(array))`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00
			`def get_name(self):`
get_dim_names and get_identifiers added in dataset 2006-04-24 13:23:30 +02:00			`"""Returns dataset name"""`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`return self._name`
get_dim_names and get_identifiers added in dataset 2006-04-24 13:23:30 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`def get_all_dims(self):`
get_dim_names and get_identifiers added in dataset 2006-04-24 13:23:30 +02:00			`"""Returns all dimensions in project"""`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`return self._all_dims`

removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`def get_dim_name(self,axis=None):`
			`"""Returns dim name for an axis, if no axis is provided it returns a list of dims"""`
			`if type(axis)==int:`
			`return self._dims[axis]`
			`else:`
			`return [dim for dim in self]`
get_dim_names and get_identifiers added in dataset 2006-04-24 13:23:30 +02:00
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`def get_identifiers(self, dim, indices=None,sorted=True):`
			`"""Returns identifiers along dim, sorted by position (index) is optional.`
Implemented Dataset.get_indices() and extended Dataset.get_identifiers() to convert between indices and identifiers and subsets thereof. Also added tests. 2006-05-02 16:06:48 +02:00
			`You can optionally provide a list of indices to get only the`
			`identifiers of a given position.`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00
			`Identifiers are the unique names (strings) for a variable in a given dim.`
			`Index (Indices) are the Identifiers position in a matrix in a given dim.`
Implemented Dataset.get_indices() and extended Dataset.get_identifiers() to convert between indices and identifiers and subsets thereof. Also added tests. 2006-05-02 16:06:48 +02:00			`"""`
2006-08-01 13:01:52 +02:00			`try:`
			`if len(indices)==0:# if empty list or empty array`
			`indices=[]`
			`except:`
			`pass`

removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`if sorted==True:`
			`items = self._map[dim].items()`
			`backitems = [ [v[1],v[0]] for v in items]`
			`backitems.sort()`
			`ids = [ backitems[i][1] for i in range(0,len(backitems))]`

Implemented Dataset.get_indices() and extended Dataset.get_identifiers() to convert between indices and identifiers and subsets thereof. Also added tests. 2006-05-02 16:06:48 +02:00			`else:`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`ids = self._map[dim].keys()`

			`if indices != None:`
bugfix in get_identifiers 2006-08-01 12:33:45 +02:00			`ids = [ids[index] for index in indices]`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00
			`return ids`


			`def get_indices(self, dim, idents=None):`
			`"""Returns indices for identifiers along dimension.`

			`You can optionally provide a list of identifiers to retrieve a index subset.`


			`Identifiers are the unique names (strings) for a variable in a given dim.`
			`Index (Indices) are the Identifiers position in a matrix in a given dim."""`
			`if idents==None:`
			`index = array_sort(self._map[dim].values())`
			`else:`
bugfix in get_identifiers 2006-08-01 12:33:45 +02:00			`index = [self._map[dim][key] for key in idents]`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`return asarray(index)`
Added category dataset 2006-08-08 09:54:00 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`class CategoryDataset(Dataset):`
			`"""The category dataset class.`

			`A dataset for representing class information as binary`
			`matrices (0/1-matrices).`

			`There is support for using a less memory demanding, and`
			`fast intersection look-ups by representing the binary matrix as a`
			`dictionary in each dimension.`
Added category dataset 2006-08-08 09:54:00 +02:00
			`Always has linked dimension in first dim:`
			`ex matrix:`
			`go_term1 go_term2 ...`
			`gene_1`
			`gene_2`
			`gene_3`
			`.`
			`.`
			`.`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`"""`

Added category dataset 2006-08-08 09:54:00 +02:00			`def __init__(self,array,identifiers=None,name='A'):`
			`Dataset.__init__(self,array,identifiers=identifiers,name=name)`
			`self.has_dictlists = False`
category data and plot selection update\| 2006-04-19 12:37:44 +02:00
Added category dataset 2006-08-08 09:54:00 +02:00			`def as_dict_lists(self):`
			`"""Returns data as dict of indices along first dim"""`
			`data={}`
			`for name,ind in self._map[self.get_dim_name(0)].items():`
			`data[name] = list(nonzero(self._array[ind,:]))`
			`self._dictlists = data`
			`self.has_dictlists=True`
			`return data`
category data and plot selection update\| 2006-04-19 12:37:44 +02:00
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`class GraphDataset(Dataset):`
			`"""The graph dataset class.`

			`A dataset class for representing graphs using an adjacency matrix`
			`(aka. restricted to square symmetric signed integers matrices)`

			`If the library NetworkX is installed, there is support for`
			`representing the graph as a NetworkX.Graph, or NetworkX.XGraph structure.`
			`"""`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`def __init__(self,array=None,identifiers=None,shape=None,all_dims=[],**kwds):`
			`Dataset.__init__(self,array=array,identifiers=identifiers,name='A')`
Complete rewrite of dataset class, with (all) the necessary updates 2006-04-24 11:53:07 +02:00			`self.has_graph = False`

removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`def asnetworkx(self,nx_type='graph'):`
* system/plots.py: Added NetworkPlot, which may or may not work correctly. * system/dataset.py: Removed a few lines of obsolete code. 2006-08-01 15:22:39 +02:00			`dim = self.get_dim_name()[0]`
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`ids = self.get_identifiers(dim)`
			`adj_mat = self.asarray()`
			`G = self._graph_from_adj_matrix(adj_mat,labels=ids)`
			`self.has_graph = True`
			`return G`

			`def _graph_from_adj_matrix(self,A,labels=None,nx_type='graph'):`
			`"""Creates a networkx graph class from adjacency matrix and ordered labels.`
			`nx_type = ['graph',['xgraph']]`
			`labels = None, results in string-numbered labels`

			`"""`
			`import networkx as nx`
			`m,n = shape(A)# adjacency matrix must be of type that evals to true/false for neigbours`
			`if m!=n:`
			`raise IOError, "Adjacency matrix must be square"`
			`if nx_type=='graph':`
			`G = nx.Graph()`
			`elif nx_type=='x_graph':`
			`G = nx.XGraph()`
			`else:`
			`raise IOError, "Unknown graph type: %s" %nx_type`

			`if labels==None: # if labels not provided mark vertices with numbers`
			`labels = [str(i) for i in range(m)]`


			`for nbrs,head in izip(A,labels):`
			`for i,nbr in enumerate(nbrs):`
			`if nbr:`
			`tail = labels[i]`
			`G.add_edge(head,tail)`
			`return G`
* system/plots.py: Added NetworkPlot, which may or may not work correctly. * system/dataset.py: Removed a few lines of obsolete code. 2006-08-01 15:22:39 +02:00
removed shape in constructor, added all_dims to dataset base class, updated get_identifiers and get_indices Denne linjen og de som er under vil bli ignorert-- M dataset.py 2006-08-01 11:45:53 +02:00			`Dataset._all_dims=set()`

First commit 2006-04-17 00:57:50 +02:00			`class Selection:`
op 2006-04-17 11:08:40 +02:00			`"""Handles selected identifiers along each dimension of a dataset"""`
First commit 2006-04-17 00:57:50 +02:00			`def __init__(self):`
			`self.current_selection={}`
Added a selection view tab, placed next to the "Log" tab. The tab currently only displays the current selection. 2006-08-07 16:14:42 +02:00