# Copyright 2019 Google LLC
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
"""Layer which represents linear function. See class level comment.
This layer applies a linear transformation to the input tensor with an optional
bias term. It supports monotonicity, monotonic dominance and fixed-norm
constraints.
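
For example (an illustrative sketch; the feature count and input values are
assumptions, not part of this module):

```python
import tensorflow as tf
import tensorflow_lattice as tfl

linear = tfl.layers.Linear(num_input_dims=3, monotonicities="increasing")
output = linear(tf.constant([[1.0, 2.0, 3.0]]))  # Shape: (1, 1).
```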
"""

from __future__ import absolute_import
from __future__ import division
from __future__ import print_function

import numpy as np
import tensorflow as tf

# pylint: disable=g-import-not-at-top
# Use Keras 2.
version_fn = getattr(tf.keras, "version", None)
if version_fn and version_fn().startswith("3."):
  import tf_keras as keras
else:
  keras = tf.keras

from . import linear_lib
from . import utils

LINEAR_LAYER_KERNEL_NAME = "linear_layer_kernel"
LINEAR_LAYER_BIAS_NAME = "linear_layer_bias"


class Linear(keras.layers.Layer):
  # pyformat: disable
  """Layer which represents linear function.

  Monotonicity can be specified for any input dimension, in which case the
  learned weight for that dimension is guaranteed to be non-negative for
  increasing monotonicity or non-positive for decreasing monotonicity.

  Monotonic dominance can be specified for any pair of dimensions, referred to
  as the *dominant* and *weak* dimensions, such that the effect (slope) in the
  direction of the *dominant* dimension is greater than that of the *weak*
  dimension at any point. Both dominant and weak dimensions must be increasing.

  Range dominance can be specified for any pair of *dominant* and *weak*
  dimensions such that the range of possible outputs is greater when one varies
  the *dominant* dimension than when one varies the *weak* dimension at any
  point. We require the slope of the *dominant* dimension scaled by its input
  range to be greater than the slope of the *weak* dimension similarly scaled
  by its input range. Both dimensions must have the same direction of
  monotonicity, and their input min and max must be provided.

  Weights can be constrained to have a fixed norm.

  Input shape:
    - if `units == 1`: tensor of shape `(batch_size, num_input_dims)`.
    - if `units > 1`: tensor of shape `(batch_size, units, num_input_dims)`.

  Output shape:
    Rank-2 tensor with shape `(batch_size, units)`.

  Attributes:
    - All `__init__` arguments.
    kernel: layer's kernel.
    bias: layer's bias. Only available if `use_bias == True`.

  Example:

  ```python
  layer = tfl.layers.Linear(
      num_input_dims=8,
      # Monotonicity constraints can be defined per dimension or for all dims.
      monotonicities='increasing',
      use_bias=True,
      # You can force the L1 norm to be 1. Since this is a monotonic layer,
      # the coefficients will sum to 1, making this a "weighted average".
      normalization_order=1)
  ```
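
  A hedged sketch of a dominance constraint (the two-dimensional setup is an
  assumption chosen for illustration):

  ```python
  # The slope of dimension 0 is constrained to be at least that of
  # dimension 1; both dimensions must be increasing.
  layer = tfl.layers.Linear(
      num_input_dims=2,
      monotonicities=['increasing', 'increasing'],
      monotonic_dominances=[(0, 1)])
  ```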
"""
# pyformat: enable

  def __init__(self,
               num_input_dims,
               units=1,
               monotonicities=None,
               monotonic_dominances=None,
               range_dominances=None,
               input_min=None,
               input_max=None,
               use_bias=True,
               normalization_order=None,
               kernel_initializer="random_uniform",
               bias_initializer="random_uniform",
               kernel_regularizer=None,
               bias_regularizer=None,
               **kwargs):
"""initializes an instance of `Linear`.
Args:
num_input_dims: Number of input dimensions.
units: Output dimension of the layer.
monotonicities: None or list or tuple of length 'num_input_dims' of
{'decreasing', 'none', 'increasing', -1, 0, 1} which specifies if the
model output should be monotonic in corresponding feature, using
'increasing' or 1 to indicate increasing monotonicity, 'decreasing' or
-1 to indicate decreasing monotonicity and 'none' or 0 to indicate no
monotonicity constraints. In case of decreasing monotonicity
corresponding weight will be constrained to be non positive, in case of
increasing non-negative. Instead of a list or tuple single value can be
specified to indicate the monotonicity constraint across all dimensions.
monotonic_dominances: None or list of two-element tuples. First element is
the index of the dominant dimension. Second element is the index of the
weak dimension.
range_dominances: None or list of two-element tuples. First element is the
index of the dominant dimension. Second element is the index of the weak
dimension. Both dominant and weak dimensions must have input_min and
input_max set.
input_min: None of list or tuple of length 'num_input_dims' of either
'none' or float which specifies the minimum value to clip by for each
dimension.
input_max: None of list or tuple of length 'num_input_dims' of either
'none' or float which specifies the maximum value to clip by for each
dimension.
use_bias: Whether linear function has bias.
normalization_order: If specified learned weights will be adjusted to have
norm 1. Norm will be computed by: `tf.norm(tensor,
ord=normalization_order)`.
kernel_initializer: Any keras initializer to be applied to kernel.
bias_initializer: Any keras initializer to be applied to bias. Only valid
if `use_bias == True`.
kernel_regularizer: None or single element or list of any Keras
regularizer objects.
bias_regularizer: None or single element or list of any Keras regularizer
objects.
**kwargs: Other args passed to `keras.layers.Layer` initializer.
Raises:
ValueError: if monotonicity specified incorrectly.
"""
    super(Linear, self).__init__(**kwargs)
    self.num_input_dims = num_input_dims
    self.units = units
    if isinstance(monotonicities, (list, tuple)):
      self.monotonicities = list(monotonicities)
    elif monotonicities is not None:
      self.monotonicities = [monotonicities] * self.num_input_dims
    else:
      self.monotonicities = [0] * self.num_input_dims
    self.monotonic_dominances = monotonic_dominances
    self.range_dominances = range_dominances
    self.input_min = input_min
    self.input_max = input_max
    # Verify hyperparameters after converting monotonicities to a list because
    # internally everything expects monotonicities to be a list or tuple rather
    # than a single element.
    linear_lib.verify_hyperparameters(
        num_input_dims=self.num_input_dims, monotonicities=self.monotonicities)
    self.use_bias = use_bias
    self.normalization_order = normalization_order
    self.kernel_initializer = keras.initializers.get(kernel_initializer)
    if use_bias:
      self.bias_initializer = keras.initializers.get(bias_initializer)
    self.kernel_regularizer = []
    if kernel_regularizer:
      if callable(kernel_regularizer):
        kernel_regularizer = [kernel_regularizer]
      for reg in kernel_regularizer:
        self.kernel_regularizer.append(keras.regularizers.get(reg))
    self.bias_regularizer = []
    if bias_regularizer:
      if callable(bias_regularizer):
        bias_regularizer = [bias_regularizer]
      for reg in bias_regularizer:
        self.bias_regularizer.append(keras.regularizers.get(reg))
    if units == 1:
      input_shape = (None, num_input_dims)
    else:
      input_shape = (None, units, num_input_dims)
    self.input_spec = keras.layers.InputSpec(
        dtype=self.dtype, shape=input_shape)

  def build(self, input_shape):
    """Standard Keras build() method.

    Args:
      input_shape: Must be `(batch_size, num_input_dims)` if `units == 1`, or
        `(batch_size, units, num_input_dims)` if `units > 1`.

    Raises:
      ValueError: If the shape is invalid.
    """
    linear_lib.verify_hyperparameters(
        num_input_dims=self.num_input_dims,
        units=self.units,
        input_shape=input_shape)
    if (any(self.monotonicities) or self.monotonic_dominances or
        self.range_dominances or self.normalization_order):
      constraints = LinearConstraints(
          monotonicities=self.monotonicities,
          monotonic_dominances=self.monotonic_dominances,
          range_dominances=self.range_dominances,
          input_min=self.input_min,
          input_max=self.input_max,
          normalization_order=self.normalization_order)
    else:
      constraints = None

    if not self.kernel_regularizer:
      kernel_reg = None
    elif len(self.kernel_regularizer) == 1:
      kernel_reg = self.kernel_regularizer[0]
    else:
      # Keras interface assumes only one regularizer, so sum all the
      # regularization losses which we have.
      kernel_reg = lambda x: tf.add_n([r(x) for r in self.kernel_regularizer])

    self.kernel = self.add_weight(
        LINEAR_LAYER_KERNEL_NAME,
        # A one-column matrix rather than a vector, for matrix multiplication.
        shape=[self.num_input_dims, self.units],
        initializer=self.kernel_initializer,
        regularizer=kernel_reg,
        constraint=constraints,
        dtype=self.dtype)

    if self.use_bias:
      if not self.bias_regularizer:
        bias_reg = None
      elif len(self.bias_regularizer) == 1:
        bias_reg = self.bias_regularizer[0]
      else:
        bias_reg = lambda x: tf.add_n([r(x) for r in self.bias_regularizer])
      self.bias = self.add_weight(
          LINEAR_LAYER_BIAS_NAME,
          shape=[] if self.units == 1 else [self.units],
          initializer=self.bias_initializer,
          regularizer=bias_reg,
          constraint=None,
          dtype=self.dtype)

    input_min = utils.canonicalize_input_bounds(self.input_min)
    input_max = utils.canonicalize_input_bounds(self.input_max)
    if ((input_min and input_min.count(None) < len(input_min)) or
        (input_max and input_max.count(None) < len(input_max))):
      lower_bounds = [val if val is not None else -np.inf
                      for val in input_min or [None] * self.num_input_dims]
      upper_bounds = [val if val is not None else np.inf
                      for val in input_max or [None] * self.num_input_dims]
      self.clip_value_min = tf.constant(lower_bounds, dtype=self.dtype)
      self.clip_value_max = tf.constant(upper_bounds, dtype=self.dtype)
    else:
      self.clip_value_min = None
      self.clip_value_max = None

    super(Linear, self).build(input_shape)

  def call(self, inputs):
    """Standard Keras call() method."""
    if self.clip_value_min is not None and self.clip_value_max is not None:
      inputs = tf.clip_by_value(
          inputs,
          clip_value_min=self.clip_value_min,
          clip_value_max=self.clip_value_max)
    if self.units == 1:
      result = tf.matmul(inputs, self.kernel)
    else:
      # Each unit has its own row of inputs, so compute per-unit dot products
      # via broadcasting rather than a single matmul.
      result = tf.reduce_sum(inputs * tf.transpose(self.kernel), axis=-1)
    if self.use_bias:
      result += self.bias
    return result

  def compute_output_shape(self, input_shape):
    """Standard Keras compute_output_shape() method."""
    del input_shape
    return [None, self.units]

  def get_config(self):
    """Standard Keras get_config() method."""
    config = {
        "num_input_dims": self.num_input_dims,
        "units": self.units,
        "monotonicities": self.monotonicities,
        "use_bias": self.use_bias,
        "normalization_order": self.normalization_order,
        "monotonic_dominances": self.monotonic_dominances,
        "range_dominances": self.range_dominances,
        "input_min": self.input_min,
        "input_max": self.input_max,
        "kernel_initializer":
            keras.initializers.serialize(
                self.kernel_initializer, use_legacy_format=True),
        "kernel_regularizer": [
            keras.regularizers.serialize(r, use_legacy_format=True)
            for r in self.kernel_regularizer
        ],
    }  # pyformat: disable
    if self.use_bias:
      config["bias_initializer"] = keras.initializers.serialize(
          self.bias_initializer, use_legacy_format=True)
      config["bias_regularizer"] = [
          keras.regularizers.serialize(r, use_legacy_format=True)
          for r in self.bias_regularizer
      ]
    config.update(super(Linear, self).get_config())
    return config

  # Default eps is bigger than for other layers because normalization is
  # prone to numerical errors.
  def assert_constraints(self, eps=1e-4):
    """Asserts that weights satisfy all constraints.

    In graph mode builds and returns a list of assertion ops.
    In eager mode directly executes the assertions.
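
    Example (an illustrative sketch, assuming eager mode and a built layer):

    ```python
    layer.assert_constraints(eps=1e-4)  # Raises if constraints are violated.
    ```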

    Args:
      eps: Allowed constraints violation.

    Returns:
      List of assertion ops in graph mode, or immediately asserts in eager
      mode.
    """
    return linear_lib.assert_constraints(
        weights=self.kernel,
        monotonicities=utils.canonicalize_monotonicities(self.monotonicities),
        monotonic_dominances=self.monotonic_dominances,
        range_dominances=self.range_dominances,
        input_min=utils.canonicalize_input_bounds(self.input_min),
        input_max=utils.canonicalize_input_bounds(self.input_max),
        normalization_order=self.normalization_order,
        eps=eps)


class LinearConstraints(keras.constraints.Constraint):
  # pyformat: disable
  """Applies monotonicity constraints and normalization to a TFL Linear layer.

  Monotonicity is specified per input dimension, in which case the learned
  weight for that dimension is guaranteed to be non-negative for increasing
  monotonicity or non-positive for decreasing monotonicity.

  Monotonic dominance can be specified for any pair of dimensions, referred to
  as the *dominant* and *weak* dimensions, such that the effect (slope) in the
  direction of the *dominant* dimension is greater than that of the *weak*
  dimension at any point. Both dominant and weak dimensions must be increasing.

  Range dominance can be specified for any pair of *dominant* and *weak*
  dimensions such that the range of possible outputs is greater when one varies
  the *dominant* dimension than when one varies the *weak* dimension at any
  point. We require the slope of the *dominant* dimension scaled by its input
  range to be greater than the slope of the *weak* dimension similarly scaled
  by its input range. Both dimensions must have the same direction of
  monotonicity, and their input min and max must be provided.

  Weights can be constrained to have norm 1.

  Attributes:
    - All `__init__` arguments.
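
  Example (an illustrative sketch; the weight values are assumptions):

  ```python
  constraint = LinearConstraints(monotonicities=["increasing", "increasing"])
  w = tf.constant([[0.5], [-0.2]])
  # Projection onto the feasible set: for increasing dimensions, negative
  # weights are moved up to zero, so -0.2 becomes 0.0 here.
  projected_w = constraint(w)
  ```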
"""
# pyformat: enable

  def __init__(self,
               monotonicities,
               monotonic_dominances=None,
               range_dominances=None,
               input_min=None,
               input_max=None,
               normalization_order=None):
    """Initializes an instance of `LinearConstraints`.

    Args:
      monotonicities: Same meaning as the corresponding parameter of `Linear`.
      monotonic_dominances: Same meaning as the corresponding parameter of
        `Linear`.
      range_dominances: Same meaning as the corresponding parameter of
        `Linear`.
      input_min: Same meaning as the corresponding parameter of `Linear`.
      input_max: Same meaning as the corresponding parameter of `Linear`.
      normalization_order: Same meaning as the corresponding parameter of
        `Linear`.
    """
    linear_lib.verify_hyperparameters(
        monotonicities=monotonicities,
        monotonic_dominances=monotonic_dominances,
        range_dominances=range_dominances,
        input_min=input_min,
        input_max=input_max)
    self.monotonicities = monotonicities
    self.monotonic_dominances = monotonic_dominances
    self.range_dominances = range_dominances
    self.input_min = input_min
    self.input_max = input_max
    self.normalization_order = normalization_order

  def __call__(self, w):
    """Applies constraints to `w`.

    Args:
      w: Tensor which represents weights of a TFL linear layer. Must have
        shape `(len(self.monotonicities), 1)`.

    Raises:
      ValueError: If the shape of `w` is not `(len(self.monotonicities), 1)`.

    Returns:
      Tensor `w` with monotonicity constraints and normalization applied to it.
    """
    return linear_lib.project(
        weights=w,
        monotonicities=utils.canonicalize_monotonicities(self.monotonicities),
        monotonic_dominances=self.monotonic_dominances,
        range_dominances=self.range_dominances,
        input_min=utils.canonicalize_input_bounds(self.input_min),
        input_max=utils.canonicalize_input_bounds(self.input_max),
        normalization_order=self.normalization_order)

  def get_config(self):
    """Standard Keras get_config() method."""
    return {
        "monotonicities": self.monotonicities,
        "monotonic_dominances": self.monotonic_dominances,
        "range_dominances": self.range_dominances,
        "input_min": self.input_min,
        "input_max": self.input_max,
        "normalization_order": self.normalization_order,
    }  # pyformat: disable