Every line of 'pandas diff' code snippets is scanned for vulnerabilities by our powerful machine learning engine that combs millions of open source libraries, ensuring your Python code is secure.
3081 def _diff(self, periods, part_cols=()): 3082 if not isinstance(periods, int): 3083 raise ValueError('periods should be an int; however, got [%s]' % type(periods)) 3084 window = Window.partitionBy(*part_cols).orderBy(self._internal.index_scols)\ 3085 .rowsBetween(-periods, -periods) 3086 scol = self._scol - F.lag(self._scol, periods).over(window) 3087 return self._with_new_scol(scol).rename(self.name)
def _diff(self, *args, **kwargs):
    """Run ``Series._diff`` on ``self._kser``, partitioned by the group keys.

    The ``_scol`` of every entry in ``self._groupkeys`` is collected and
    passed as ``part_cols``; all other positional and keyword arguments
    are forwarded unchanged.
    """
    partition_columns = [key._scol for key in self._groupkeys]
    return Series._diff(
        self._kser,
        *args,
        part_cols=partition_columns,
        **kwargs
    )
def _get_diff_data(df, name):
    """Build one summary row of percentages for the diff columns of ``name``.

    The columns returned by ``_get_diff_column_names(name)`` are summed
    individually, then combined into three buckets: entry 2 alone,
    entries 1 and 3 together, and entries 0 and 4 together. Each bucket is
    expressed as a percentage of the grand total.

    Returns a list: ``name`` without its last character, the grand total,
    then the three percentages.
    """
    column_totals = df[_get_diff_column_names(name)].sum()
    grand_total = column_totals.sum()
    # NOTE(review): integer keys are used as in the original; whether they
    # resolve by position or by label depends on the column names, which
    # are not visible here. Presumably five columns are expected; confirm.
    bucket_counts = np.array([
        column_totals[2],
        column_totals[1] + column_totals[3],
        column_totals[0] + column_totals[4],
    ])
    bucket_percentages = 100. * bucket_counts / float(grand_total)
    row = [name[:-1], grand_total]
    row.extend(bucket_percentages)
    return row