BlosSOM
Interactive dimensionality reduction on large datasets (EmbedSOM and FLOWER combined)
color_data.cpp
Go to the documentation of this file.
1/* This file is part of BlosSOM.
2 *
3 * Copyright (C) 2021 Mirek Kratochvil
4 * Sona Molnarova
5 *
6 * BlosSOM is free software: you can redistribute it and/or modify it under
7 * the terms of the GNU General Public License as published by the Free
8 * Software Foundation, either version 3 of the License, or (at your option)
9 * any later version.
10 *
11 * BlosSOM is distributed in the hope that it will be useful, but WITHOUT ANY
12 * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
13 * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more
14 * details.
15 *
16 * You should have received a copy of the GNU General Public License along with
17 * BlosSOM. If not, see <https://www.gnu.org/licenses/>.
18 */
19
20#include "color_data.h"
21#include "pnorm.h"
22#include "vendor/colormap/palettes.hpp"
23
24void
26 const LandmarkModel &lm,
27 FrameStats &frame_stats)
28{
29 if (td.n != data.size()) {
30 data.resize(td.n, glm::vec4(0, 0, 0, 0));
31 refresh(td);
32 frame_stats.reset(frame_stats.color_t);
34 }
35
36 if (lm_watch.dirty(lm) && coloring == ColorData::Coloring::BRUSHING) {
37 landmarks.resize(lm.n_landmarks(), { &default_landmark_color, -1 });
38 refresh(td);
39 lm_watch.clean(lm);
40 }
41
42 auto [ri, rn] = dirty_range(td);
43 if (!rn) {
44 frame_stats.reset(frame_stats.color_t);
45 return;
46 }
47
48 const size_t max_points =
49 batch_size_gen.next(frame_stats.color_t, frame_stats.color_duration);
50
51 if (rn > max_points)
52 rn = max_points;
53
54 size_t n = td.n;
55 size_t d = td.dim();
56
57 clean_range(td, rn);
58
59 frame_stats.add_const_time();
60
61 switch (coloring) {
62 case int(ColorData::Coloring::EXPR): {
63 if (expr_col >= d)
64 expr_col = 0;
65
66 auto pal = colormap::palettes.at(col_palette).rescale(0, 1);
67 float mean = td.sums[expr_col] / n;
68 float sdev = sqrt(td.sqsums[expr_col] / n - mean * mean);
69
70 for (; rn-- > 0; ++ri) {
71 if (ri >= n)
72 ri = 0;
73 auto c =
75 ? pal(1 - pnormf(td.data[ri * d + expr_col], mean, sdev))
76 : pal(pnormf(td.data[ri * d + expr_col], mean, sdev));
77 data[ri] = glm::vec4(c.channels[0].val / 255.0f,
78 c.channels[1].val / 255.0f,
79 c.channels[2].val / 255.0f,
80 alpha);
81 }
82 } break;
83
84 case int(ColorData::Coloring::CLUSTER):
86 break;
87 case int(ColorData::Coloring::BRUSHING):
88 clustering.do_brushing(alpha, landmarks, lm, ri, rn, td, data);
89 break;
90 }
91
92 frame_stats.store_time(frame_stats.color_t);
93}
94
95void
96ColorData::color_landmarks(const std::vector<size_t> &idxs)
97{
98 for (auto &&i : idxs) {
100 }
101}
102
103void
105{
106 for (auto &&l : landmarks) {
107 if (l.second == id)
108 l = { &default_landmark_color, -1 };
109 }
110 touch_config();
111}
112
113void
115{
116 landmarks.erase(landmarks.begin() + ind);
117 touch_config();
118}
119
120void
122{
123 coloring = (int)Coloring::EXPR;
124 expr_col = 0;
125 col_palette = "rdbu";
126 alpha = 0.5f;
127 reverse = false;
129 auto lnds_size = landmarks.size();
130 landmarks = { lnds_size,
132 // Add none cluster, only for export of the data.
134
135 touch_config();
136}
137
138void
140{
141 auto index = clustering.active_cluster;
142 landmarks[ind] = { &clustering.clusters[index].first, index };
143
144 touch_config();
145}
size_t next(float T, float t)
Computes size of the next batch.
float pnormf(float x, float mean, float sd)
Definition: pnorm.cpp:155
void clean(const Dirt &d)
Call this when the cache is refreshed.
Definition: dirty.h:67
bool dirty(const Dirt &d)
Returns true if the cache needs to be refreshed.
Definition: dirty.h:60
int active_cluster
Index of the active cluster (into clusters) that is used for brushing.
Definition: cluster_data.h:53
void do_brushing(float alpha, const std::vector< std::pair< const glm::vec3 *, int > > &landmark_colors, const LandmarkModel &lm, size_t ri, size_t rn, const TransData &td, std::vector< glm::vec4 > &point_colors)
std::map< int, std::pair< glm::vec3, std::string > > clusters
Cluster colors and names for brushing, with id of cluster as a key.
Definition: cluster_data.h:49
void do_cluster_coloring(float alpha, size_t ri, size_t rn, const TransData &td, std::vector< glm::vec4 > &point_colors)
void update(const TransData &td, const LandmarkModel &lm, FrameStats &frame_stats)
Recomputes color of the 2D data points if user has changed any of the color settings.
Definition: color_data.cpp:25
void reset()
Resets color settings to their initial values.
Definition: color_data.cpp:121
void color_landmarks(const std::vector< size_t > &idxs)
Notifies Sweeper that the color settings has been modified and that the data has to be recomputed.
Definition: color_data.cpp:96
std::vector< std::pair< const glm::vec3 *, int > > landmarks
Colors of the landmarks and id of the cluster.
Definition: color_data.h:63
bool reverse
Flag indicating if the colors of the color palette should be reversed.
Definition: color_data.h:76
float alpha
Alpha channel of RGBA color.
Definition: color_data.h:73
int expr_col
Index of the column used in expression coloring.
Definition: color_data.h:67
void reset_landmark_color(int id)
Reset colors and cluster ids of all landmarks in the cluster with input id.
Definition: color_data.cpp:104
void remove_landmark(size_t ind)
Definition: color_data.cpp:114
ClusterData clustering
Definition: color_data.h:71
void touch_config()
Definition: color_data.h:118
Cleaner lm_watch
Definition: color_data.h:54
int coloring
Type of the coloring method.
Definition: color_data.h:65
void color_landmark(size_t ind)
Color the landmark according to the active cluster.
Definition: color_data.cpp:139
std::string col_palette
Name of the currently used color palette.
Definition: color_data.h:69
std::vector< glm::vec4 > data
Colors of the 2D data points.
Definition: color_data.h:59
const glm::vec3 default_landmark_color
Definition: color_data.h:52
BatchSizeGen batch_size_gen
Definition: color_data.h:78
size_t n
Definition: dirty.h:83
void add_const_time()
Definition: frame_stats.h:73
float color_t
Definition: frame_stats.h:33
void store_time(float &to)
Definition: frame_stats.h:79
void reset(float &t)
Definition: frame_stats.h:85
float color_duration
Definition: frame_stats.h:43
Model of the high- and low-dimensional landmarks.
size_t n_landmarks() const
Reurns number of the 2D landmarks.
std::tuple< size_t, size_t > dirty_range(const Dirts &d)
Find the range to refresh.
Definition: dirty.h:113
void clean_range(const Dirts &d, size_t n)
Clean a range of the cache.
Definition: dirty.h:130
void refresh(const Dirts &d)
Force-refresh the whole range.
Definition: dirty.h:105
Storage of the transformed data.
Definition: trans_data.h:74
size_t dim() const
Returns dimension of the transformed data.
Definition: trans_data.h:93
std::vector< float > data
Transformed data in the same format as DataModel::data.
Definition: trans_data.h:76
std::vector< float > sums
Array representing sums for each dimension.
Definition: trans_data.h:79
std::vector< float > sqsums
Array representing square sums for each dimension.
Definition: trans_data.h:81