struct cfs_rq *busiest_cfs_rq = tg->cfs_rq[busiest_cpu];
                unsigned long busiest_h_load = busiest_cfs_rq->h_load;
                unsigned long busiest_weight = busiest_cfs_rq->load.weight;
-               long rem_load, moved_load;
+               u64 rem_load, moved_load;
 
                /*
                 * empty group
                if (!busiest_cfs_rq->task_weight)
                        continue;
 
-               rem_load = rem_load_move * busiest_weight;
-               rem_load /= busiest_h_load + 1;
+               rem_load = (u64)rem_load_move * busiest_weight;
+               rem_load = div_u64(rem_load, busiest_h_load + 1);
 
                moved_load = __load_balance_fair(this_rq, this_cpu, busiest,
                                rem_load, sd, idle, all_pinned, this_best_prio,
                        continue;
 
                moved_load *= busiest_h_load;
-               moved_load /= busiest_weight + 1;
+               moved_load = div_u64(moved_load, busiest_weight + 1);
 
                rem_load_move -= moved_load;
                if (rem_load_move < 0)